diff --git a/.github/workflows/comment_bot.yml b/.github/workflows/comment_bot.yml index 35d889152fb..b78ae80fb97 100644 --- a/.github/workflows/comment_bot.yml +++ b/.github/workflows/comment_bot.yml @@ -95,8 +95,8 @@ jobs: set -ex export PATH=/home/runner/.local/bin:$PATH python3 -m pip install --upgrade pip setuptools wheel - python3 -m pip install -r dev/archery/requirements-lint.txt - python3 run-cmake-format.py + python3 -m pip install -e dev/archery[lint] + archery lint --cmake-format --fix - name: Run clang-format on cpp if: env.CLANG_FORMAT_CPP == 'true' || endsWith(github.event.comment.body, 'everything') run: | diff --git a/.github/workflows/r.yml b/.github/workflows/r.yml index 5acb47a0ae0..e160ba8128a 100644 --- a/.github/workflows/r.yml +++ b/.github/workflows/r.yml @@ -247,6 +247,7 @@ jobs: Sys.setenv( RWINLIB_LOCAL = file.path(Sys.getenv("GITHUB_WORKSPACE"), "libarrow.zip"), MAKEFLAGS = paste0("-j", parallel::detectCores()), + ARROW_R_DEV = TRUE, "_R_CHECK_FORCE_SUGGESTS_" = FALSE ) rcmdcheck::rcmdcheck("r", diff --git a/c_glib/arrow-dataset-glib/arrow-dataset-glib.h b/c_glib/arrow-dataset-glib/arrow-dataset-glib.h index 03e56516112..58f4e216cc7 100644 --- a/c_glib/arrow-dataset-glib/arrow-dataset-glib.h +++ b/c_glib/arrow-dataset-glib/arrow-dataset-glib.h @@ -23,6 +23,8 @@ #include #include +#include #include #include +#include #include diff --git a/c_glib/arrow-dataset-glib/arrow-dataset-glib.hpp b/c_glib/arrow-dataset-glib/arrow-dataset-glib.hpp index 65341b9b77e..8e996506884 100644 --- a/c_glib/arrow-dataset-glib/arrow-dataset-glib.hpp +++ b/c_glib/arrow-dataset-glib/arrow-dataset-glib.hpp @@ -25,4 +25,5 @@ #include #include #include +#include #include diff --git a/c_glib/arrow-dataset-glib/dataset-factory.cpp b/c_glib/arrow-dataset-glib/dataset-factory.cpp index 146db69adfc..433e58b2031 100644 --- a/c_glib/arrow-dataset-glib/dataset-factory.cpp +++ b/c_glib/arrow-dataset-glib/dataset-factory.cpp @@ -23,6 +23,7 @@ #include #include #include +#include G_BEGIN_DECLS @@ -142,6 +143,7 @@ gadataset_dataset_factory_finish(GADatasetDatasetFactory *factory, typedef struct GADatasetFileSystemDatasetFactoryPrivate_ { GADatasetFileFormat *format; GArrowFileSystem *file_system; + GADatasetPartitioning *partitioning; GList *files; arrow::dataset::FileSystemFactoryOptions options; } GADatasetFileSystemDatasetFactoryPrivate; @@ -149,6 +151,8 @@ typedef struct GADatasetFileSystemDatasetFactoryPrivate_ { enum { PROP_FORMAT = 1, PROP_FILE_SYSTEM, + PROP_PARTITIONING, + PROP_PARTITION_BASE_DIR, }; G_DEFINE_TYPE_WITH_PRIVATE(GADatasetFileSystemDatasetFactory, @@ -175,6 +179,11 @@ gadataset_file_system_dataset_factory_dispose(GObject *object) priv->file_system = NULL; } + if (priv->partitioning) { + g_object_unref(priv->partitioning); + priv->partitioning = NULL; + } + if (priv->files) { g_list_free_full(priv->files, g_object_unref); priv->files = NULL; @@ -205,6 +214,29 @@ gadataset_file_system_dataset_factory_set_property(GObject *object, case PROP_FORMAT: priv->format = GADATASET_FILE_FORMAT(g_value_dup_object(value)); break; + case PROP_PARTITIONING: + { + auto partitioning = g_value_get_object(value); + if (partitioning == priv->partitioning) { + break; + } + auto old_partitioning = priv->partitioning; + if (partitioning) { + g_object_ref(partitioning); + priv->partitioning = GADATASET_PARTITIONING(partitioning); + priv->options.partitioning = + gadataset_partitioning_get_raw(priv->partitioning); + } else { + priv->options.partitioning = arrow::dataset::Partitioning::Default(); + } + 
if (old_partitioning) { + g_object_unref(old_partitioning); + } + } + break; + case PROP_PARTITION_BASE_DIR: + priv->options.partition_base_dir = g_value_get_string(value); + break; default: G_OBJECT_WARN_INVALID_PROPERTY_ID(object, prop_id, pspec); break; @@ -226,6 +258,12 @@ gadataset_file_system_dataset_factory_get_property(GObject *object, case PROP_FILE_SYSTEM: g_value_set_object(value, priv->file_system); break; + case PROP_PARTITIONING: + g_value_set_object(value, priv->partitioning); + break; + case PROP_PARTITION_BASE_DIR: + g_value_set_string(value, priv->options.partition_base_dir.c_str()); + break; default: G_OBJECT_WARN_INVALID_PROPERTY_ID(object, prop_id, pspec); break; @@ -279,6 +317,35 @@ gadataset_file_system_dataset_factory_class_init( GARROW_TYPE_FILE_SYSTEM, static_cast(G_PARAM_READABLE)); g_object_class_install_property(gobject_class, PROP_FILE_SYSTEM, spec); + + /** + * GADatasetFileSystemDatasetFactory:partitioning: + * + * Partitioning used by #GADatasetFileSystemDataset. + * + * Since: 6.0.0 + */ + spec = g_param_spec_object("partitioning", + "Partitioning", + "Partitioning used by GADatasetFileSystemDataset", + GADATASET_TYPE_PARTITIONING, + static_cast(G_PARAM_READWRITE)); + g_object_class_install_property(gobject_class, PROP_PARTITIONING, spec); + + /** + * GADatasetFileSystemDatasetFactory:partition-base-dir: + * + * Partition base directory used by #GADatasetFileSystemDataset. + * + * Since: 6.0.0 + */ + spec = g_param_spec_string("partition-base-dir", + "Partition base directory", + "Partition base directory " + "used by GADatasetFileSystemDataset", + NULL, + static_cast(G_PARAM_READWRITE)); + g_object_class_install_property(gobject_class, PROP_PARTITION_BASE_DIR, spec); } /** @@ -454,6 +521,7 @@ gadataset_file_system_dataset_factory_finish( "dataset", &arrow_dataset, "file-system", priv->file_system, "format", priv->format, + "partitioning", priv->partitioning, NULL)); } diff --git a/c_glib/arrow-dataset-glib/dataset.cpp b/c_glib/arrow-dataset-glib/dataset.cpp index 3bd62f99ef3..8613bedad42 100644 --- a/c_glib/arrow-dataset-glib/dataset.cpp +++ b/c_glib/arrow-dataset-glib/dataset.cpp @@ -18,11 +18,14 @@ */ #include +#include #include #include #include -#include +#include +#include +#include G_BEGIN_DECLS @@ -36,13 +39,8 @@ G_BEGIN_DECLS * * #GADatasetFileSystemDataset is a class for file system dataset. * - * #GADatasetFileFormat is a base class for file formats. - * - * #GADatasetCSVFileFormat is a class for CSV file format. - * - * #GADatasetIPCFileFormat is a class for IPC file format. - * - * #GADatasetParquetFileFormat is a class for Apache Parquet file format. + * #GADatasetFileSystemDatasetWriteOptions is a class for options to + * write a dataset to file system dataset. 
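For context on the factory changes above: both new properties are plain GObject properties, so existing callers opt in with g_object_set() before finishing the factory. A minimal sketch, assuming a factory obtained from the existing gadataset_file_system_dataset_factory_new() API and a partitioning built with the gadataset_directory_partitioning_new() constructor added later in this diff; the base directory path is illustrative:

```c
#include <arrow-dataset-glib/arrow-dataset-glib.h>

/* Sketch: discover a partitioned dataset through the new
 * "partitioning" and "partition-base-dir" factory properties. */
static GADatasetDataset *
open_partitioned_dataset(GADatasetFileSystemDatasetFactory *factory,
                         GADatasetPartitioning *partitioning,
                         GError **error)
{
  g_object_set(factory,
               "partitioning", partitioning,
               "partition-base-dir", "/data/dataset",
               NULL);
  return gadataset_dataset_factory_finish(GADATASET_DATASET_FACTORY(factory),
                                          error);
}
```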
* * Since: 5.0.0 */ @@ -190,14 +188,326 @@ gadataset_dataset_get_type_name(GADatasetDataset *dataset) } +typedef struct GADatasetFileSystemDatasetWriteOptionsPrivate_ { + arrow::dataset::FileSystemDatasetWriteOptions options; + GADatasetFileWriteOptions *file_write_options; + GArrowFileSystem *file_system; + GADatasetPartitioning *partitioning; +} GADatasetFileSystemDatasetWriteOptionsPrivate; + +enum { + PROP_FILE_WRITE_OPTIONS = 1, + PROP_FILE_SYSTEM, + PROP_BASE_DIR, + PROP_PARTITIONING, + PROP_MAX_PARTITIONS, + PROP_BASE_NAME_TEMPLATE, +}; + +G_DEFINE_TYPE_WITH_PRIVATE(GADatasetFileSystemDatasetWriteOptions, + gadataset_file_system_dataset_write_options, + G_TYPE_OBJECT) + +#define GADATASET_FILE_SYSTEM_DATASET_WRITE_OPTIONS_GET_PRIVATE(obj) \ + static_cast( \ + gadataset_file_system_dataset_write_options_get_instance_private( \ + GADATASET_FILE_SYSTEM_DATASET_WRITE_OPTIONS(obj))) + +static void +gadataset_file_system_dataset_write_options_finalize(GObject *object) +{ + auto priv = GADATASET_FILE_SYSTEM_DATASET_WRITE_OPTIONS_GET_PRIVATE(object); + priv->options.~FileSystemDatasetWriteOptions(); + G_OBJECT_CLASS(gadataset_file_system_dataset_write_options_parent_class)-> + finalize(object); +} + +static void +gadataset_file_system_dataset_write_options_dispose(GObject *object) +{ + auto priv = GADATASET_FILE_SYSTEM_DATASET_WRITE_OPTIONS_GET_PRIVATE(object); + + if (priv->file_write_options) { + g_object_unref(priv->file_write_options); + priv->file_write_options = NULL; + } + + if (priv->file_system) { + g_object_unref(priv->file_system); + priv->file_system = NULL; + } + + if (priv->partitioning) { + g_object_unref(priv->partitioning); + priv->partitioning = NULL; + } + + G_OBJECT_CLASS(gadataset_file_system_dataset_write_options_parent_class)-> + dispose(object); +} + +static void +gadataset_file_system_dataset_write_options_set_property(GObject *object, + guint prop_id, + const GValue *value, + GParamSpec *pspec) +{ + auto priv = GADATASET_FILE_SYSTEM_DATASET_WRITE_OPTIONS_GET_PRIVATE(object); + + switch (prop_id) { + case PROP_FILE_WRITE_OPTIONS: + { + auto file_write_options = g_value_get_object(value); + if (file_write_options == priv->file_write_options) { + break; + } + auto old_file_write_options = priv->file_write_options; + if (file_write_options) { + g_object_ref(file_write_options); + priv->file_write_options = + GADATASET_FILE_WRITE_OPTIONS(file_write_options); + priv->options.file_write_options = + gadataset_file_write_options_get_raw(priv->file_write_options); + } else { + priv->options.file_write_options = nullptr; + } + if (old_file_write_options) { + g_object_unref(old_file_write_options); + } + } + break; + case PROP_FILE_SYSTEM: + { + auto file_system = g_value_get_object(value); + if (file_system == priv->file_system) { + break; + } + auto old_file_system = priv->file_system; + if (file_system) { + g_object_ref(file_system); + priv->file_system = GARROW_FILE_SYSTEM(file_system); + priv->options.filesystem = garrow_file_system_get_raw(priv->file_system); + } else { + priv->options.filesystem = nullptr; + } + if (old_file_system) { + g_object_unref(old_file_system); + } + } + break; + case PROP_BASE_DIR: + priv->options.base_dir = g_value_get_string(value); + break; + case PROP_PARTITIONING: + { + auto partitioning = g_value_get_object(value); + if (partitioning == priv->partitioning) { + break; + } + auto old_partitioning = priv->partitioning; + if (partitioning) { + g_object_ref(partitioning); + priv->partitioning = GADATASET_PARTITIONING(partitioning); + 
priv->options.partitioning = + gadataset_partitioning_get_raw(priv->partitioning); + } else { + priv->options.partitioning = arrow::dataset::Partitioning::Default(); + } + if (old_partitioning) { + g_object_unref(old_partitioning); + } + } + break; + case PROP_MAX_PARTITIONS: + priv->options.max_partitions = g_value_get_uint(value); + break; + case PROP_BASE_NAME_TEMPLATE: + priv->options.basename_template = g_value_get_string(value); + break; + default: + G_OBJECT_WARN_INVALID_PROPERTY_ID(object, prop_id, pspec); + break; + } +} + +static void +gadataset_file_system_dataset_write_options_get_property(GObject *object, + guint prop_id, + GValue *value, + GParamSpec *pspec) +{ + auto priv = GADATASET_FILE_SYSTEM_DATASET_WRITE_OPTIONS_GET_PRIVATE(object); + + switch (prop_id) { + case PROP_FILE_WRITE_OPTIONS: + g_value_set_object(value, priv->file_write_options); + break; + case PROP_FILE_SYSTEM: + g_value_set_object(value, priv->file_system); + break; + case PROP_BASE_DIR: + g_value_set_string(value, priv->options.base_dir.c_str()); + break; + case PROP_PARTITIONING: + g_value_set_object(value, priv->partitioning); + break; + case PROP_MAX_PARTITIONS: + g_value_set_uint(value, priv->options.max_partitions); + break; + case PROP_BASE_NAME_TEMPLATE: + g_value_set_string(value, priv->options.basename_template.c_str()); + break; + default: + G_OBJECT_WARN_INVALID_PROPERTY_ID(object, prop_id, pspec); + break; + } +} + +static void +gadataset_file_system_dataset_write_options_init( + GADatasetFileSystemDatasetWriteOptions *object) +{ + auto priv = GADATASET_FILE_SYSTEM_DATASET_WRITE_OPTIONS_GET_PRIVATE(object); + new(&(priv->options)) arrow::dataset::FileSystemDatasetWriteOptions; + priv->options.partitioning = arrow::dataset::Partitioning::Default(); +} + +static void +gadataset_file_system_dataset_write_options_class_init( + GADatasetFileSystemDatasetWriteOptionsClass *klass) +{ + auto gobject_class = G_OBJECT_CLASS(klass); + gobject_class->finalize = + gadataset_file_system_dataset_write_options_finalize; + gobject_class->dispose = + gadataset_file_system_dataset_write_options_dispose; + gobject_class->set_property = + gadataset_file_system_dataset_write_options_set_property; + gobject_class->get_property = + gadataset_file_system_dataset_write_options_get_property; + + arrow::dataset::FileSystemDatasetWriteOptions default_options; + GParamSpec *spec; + /** + * GADatasetFileSystemDatasetWriteOptions:file_write_options: + * + * Options for individual fragment writing. + * + * Since: 6.0.0 + */ + spec = g_param_spec_object("file-write-options", + "File write options", + "Options for individual fragment writing", + GADATASET_TYPE_FILE_WRITE_OPTIONS, + static_cast(G_PARAM_READWRITE)); + g_object_class_install_property(gobject_class, PROP_FILE_WRITE_OPTIONS, spec); + + /** + * GADatasetFileSystemDatasetWriteOptions:file_system: + * + * #GArrowFileSystem into which a dataset will be written. + * + * Since: 6.0.0 + */ + spec = g_param_spec_object("file-system", + "File system", + "GArrowFileSystem into which " + "a dataset will be written", + GARROW_TYPE_FILE_SYSTEM, + static_cast(G_PARAM_READWRITE)); + g_object_class_install_property(gobject_class, PROP_FILE_SYSTEM, spec); + + /** + * GADatasetFileSystemDatasetWriteOptions:base_dir: + * + * Root directory into which the dataset will be written. 
+ * + * Since: 6.0.0 + */ + spec = g_param_spec_string("base-dir", + "Base directory", + "Root directory into which " + "the dataset will be written", + NULL, + static_cast(G_PARAM_READWRITE)); + g_object_class_install_property(gobject_class, PROP_BASE_DIR, spec); + + /** + * GADatasetFileSystemDatasetWriteOptions:partitioning: + * + * #GADatasetPartitioning used to generate fragment paths. + * + * Since: 6.0.0 + */ + spec = g_param_spec_object("partitioning", + "Partitioning", + "GADatasetPartitioning used to " + "generate fragment paths", + GADATASET_TYPE_PARTITIONING, + static_cast(G_PARAM_READWRITE)); + g_object_class_install_property(gobject_class, PROP_PARTITIONING, spec); + + /** + * GADatasetFileSystemDatasetWriteOptions:max-partitions: + * + * Maximum number of partitions any batch may be written into. + * + * Since: 6.0.0 + */ + spec = g_param_spec_uint("max-partitions", + "Max partitions", + "Maximum number of partitions " + "any batch may be written into", + 0, + G_MAXINT, + default_options.max_partitions, + static_cast(G_PARAM_READWRITE)); + g_object_class_install_property(gobject_class, PROP_MAX_PARTITIONS, spec); + + /** + * GADatasetFileSystemDatasetWriteOptions:base-name-template: + * + * Template string used to generate fragment base names. {i} will be + * replaced by an auto incremented integer. + * + * Since: 6.0.0 + */ + spec = g_param_spec_string("base-name-template", + "Base name template", + "Template string used to generate fragment " + "base names. {i} will be replaced by " + "an auto incremented integer", + NULL, + static_cast(G_PARAM_READWRITE)); + g_object_class_install_property(gobject_class, PROP_BASE_NAME_TEMPLATE, spec); +} + +/** + * gadataset_file_system_dataset_write_options_new: + * + * Returns: The newly created #GADatasetFileSystemDatasetWriteOptions. 
+ * + * Since: 6.0.0 + */ +GADatasetFileSystemDatasetWriteOptions * +gadataset_file_system_dataset_write_options_new(void) +{ + return GADATASET_FILE_SYSTEM_DATASET_WRITE_OPTIONS( + g_object_new(GADATASET_TYPE_FILE_SYSTEM_DATASET_WRITE_OPTIONS, + NULL)); +} + + typedef struct GADatasetFileSystemDatasetPrivate_ { GADatasetFileFormat *format; GArrowFileSystem *file_system; + GADatasetPartitioning *partitioning; } GADatasetFileSystemDatasetPrivate; enum { - PROP_FORMAT = 1, - PROP_FILE_SYSTEM, + PROP_FILE_SYSTEM_DATASET_FORMAT = 1, + PROP_FILE_SYSTEM_DATASET_FILE_SYSTEM, + PROP_FILE_SYSTEM_DATASET_PARTITIONING, }; G_DEFINE_TYPE_WITH_PRIVATE(GADatasetFileSystemDataset, @@ -236,12 +546,15 @@ gadataset_file_system_dataset_set_property(GObject *object, auto priv = GADATASET_FILE_SYSTEM_DATASET_GET_PRIVATE(object); switch (prop_id) { - case PROP_FORMAT: + case PROP_FILE_SYSTEM_DATASET_FORMAT: priv->format = GADATASET_FILE_FORMAT(g_value_dup_object(value)); break; - case PROP_FILE_SYSTEM: + case PROP_FILE_SYSTEM_DATASET_FILE_SYSTEM: priv->file_system = GARROW_FILE_SYSTEM(g_value_dup_object(value)); break; + case PROP_FILE_SYSTEM_DATASET_PARTITIONING: + priv->partitioning = GADATASET_PARTITIONING(g_value_dup_object(value)); + break; default: G_OBJECT_WARN_INVALID_PROPERTY_ID(object, prop_id, pspec); break; @@ -257,12 +570,15 @@ gadataset_file_system_dataset_get_property(GObject *object, auto priv = GADATASET_FILE_SYSTEM_DATASET_GET_PRIVATE(object); switch (prop_id) { - case PROP_FORMAT: + case PROP_FILE_SYSTEM_DATASET_FORMAT: g_value_set_object(value, priv->format); break; - case PROP_FILE_SYSTEM: + case PROP_FILE_SYSTEM_DATASET_FILE_SYSTEM: g_value_set_object(value, priv->file_system); break; + case PROP_FILE_SYSTEM_DATASET_PARTITIONING: + g_value_set_object(value, priv->partitioning); + break; default: G_OBJECT_WARN_INVALID_PROPERTY_ID(object, prop_id, pspec); break; @@ -296,7 +612,9 @@ gadataset_file_system_dataset_class_init(GADatasetFileSystemDatasetClass *klass) GADATASET_TYPE_FILE_FORMAT, static_cast(G_PARAM_READWRITE | G_PARAM_CONSTRUCT_ONLY)); - g_object_class_install_property(gobject_class, PROP_FORMAT, spec); + g_object_class_install_property(gobject_class, + PROP_FILE_SYSTEM_DATASET_FORMAT, + spec); /** * GADatasetFileSystemDataset:file-system: @@ -311,7 +629,52 @@ gadataset_file_system_dataset_class_init(GADatasetFileSystemDatasetClass *klass) GARROW_TYPE_FILE_SYSTEM, static_cast(G_PARAM_READWRITE | G_PARAM_CONSTRUCT_ONLY)); - g_object_class_install_property(gobject_class, PROP_FILE_SYSTEM, spec); + g_object_class_install_property(gobject_class, + PROP_FILE_SYSTEM_DATASET_FILE_SYSTEM, + spec); + + /** + * GADatasetFileSystemDataset:partitioning: + * + * Partitioning of the dataset. + * + * Since: 6.0.0 + */ + spec = g_param_spec_object("partitioning", + "Partitioning", + "Partitioning of the dataset", + GADATASET_TYPE_PARTITIONING, + static_cast(G_PARAM_READWRITE | + G_PARAM_CONSTRUCT_ONLY)); + g_object_class_install_property(gobject_class, + PROP_FILE_SYSTEM_DATASET_PARTITIONING, + spec); +} + +/** + * gadataset_file_system_dataset_write_scanner: + * @scanner: A #GADatasetScanner that produces data to be written. + * @options: A #GADatasetFileSystemDatasetWriteOptions. + * @error: (nullable): Return location for a #GError or %NULL. + * + * Returns: %TRUE on success, %FALSE on error. 
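The new write options object is configured entirely through the properties installed above, so a caller can wire everything up with a single g_object_set() call. A sketch, assuming `format`, `file_system`, and `partitioning` are created elsewhere and using the gadataset_file_format_get_default_write_options() helper added later in this diff; the base directory and base name template are illustrative:

```c
#include <arrow-dataset-glib/arrow-dataset-glib.h>

/* Sketch: assemble FileSystemDatasetWriteOptions from its properties. */
static GADatasetFileSystemDatasetWriteOptions *
make_write_options(GADatasetFileFormat *format,
                   GArrowFileSystem *file_system,
                   GADatasetPartitioning *partitioning)
{
  GADatasetFileSystemDatasetWriteOptions *options =
    gadataset_file_system_dataset_write_options_new();
  GADatasetFileWriteOptions *file_write_options =
    gadataset_file_format_get_default_write_options(format);
  g_object_set(options,
               "file-write-options", file_write_options,
               "file-system", file_system,
               "base-dir", "/data/output",
               "partitioning", partitioning,
               "base-name-template", "part-{i}.parquet",
               NULL);
  g_object_unref(file_write_options);
  return options;
}
```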
+ * + * Since: 6.0.0 + */ +gboolean +gadataset_file_system_dataset_write_scanner( + GADatasetScanner *scanner, + GADatasetFileSystemDatasetWriteOptions *options, + GError **error) +{ + auto arrow_scanner = gadataset_scanner_get_raw(scanner); + auto arrow_options = + gadataset_file_system_dataset_write_options_get_raw(options); + auto status = + arrow::dataset::FileSystemDataset::Write(*arrow_options, arrow_scanner); + return garrow::check(error, + status, + "[file-system-dataset][write-scanner]"); } @@ -363,3 +726,11 @@ gadataset_dataset_get_raw(GADatasetDataset *dataset) auto priv = GADATASET_DATASET_GET_PRIVATE(dataset); return priv->dataset; } + +arrow::dataset::FileSystemDatasetWriteOptions * +gadataset_file_system_dataset_write_options_get_raw( + GADatasetFileSystemDatasetWriteOptions *options) +{ + auto priv = GADATASET_FILE_SYSTEM_DATASET_WRITE_OPTIONS_GET_PRIVATE(options); + return &(priv->options); +} diff --git a/c_glib/arrow-dataset-glib/dataset.h b/c_glib/arrow-dataset-glib/dataset.h index 97cf35d74d7..86d077caa98 100644 --- a/c_glib/arrow-dataset-glib/dataset.h +++ b/c_glib/arrow-dataset-glib/dataset.h @@ -24,6 +24,7 @@ G_BEGIN_DECLS typedef struct _GADatasetScannerBuilder GADatasetScannerBuilder; +typedef struct _GADatasetScanner GADatasetScanner; #define GADATASET_TYPE_DATASET (gadataset_dataset_get_type()) G_DECLARE_DERIVABLE_TYPE(GADatasetDataset, @@ -49,6 +50,23 @@ gchar * gadataset_dataset_get_type_name(GADatasetDataset *dataset); +#define GADATASET_TYPE_FILE_SYSTEM_DATASET_WRITE_OPTIONS \ + (gadataset_file_system_dataset_write_options_get_type()) +G_DECLARE_DERIVABLE_TYPE(GADatasetFileSystemDatasetWriteOptions, + gadataset_file_system_dataset_write_options, + GADATASET, + FILE_SYSTEM_DATASET_WRITE_OPTIONS, + GObject) +struct _GADatasetFileSystemDatasetWriteOptionsClass +{ + GObjectClass parent_class; +}; + +GARROW_AVAILABLE_IN_6_0 +GADatasetFileSystemDatasetWriteOptions * +gadataset_file_system_dataset_write_options_new(void); + + #define GADATASET_TYPE_FILE_SYSTEM_DATASET \ (gadataset_file_system_dataset_get_type()) G_DECLARE_DERIVABLE_TYPE(GADatasetFileSystemDataset, @@ -61,5 +79,12 @@ struct _GADatasetFileSystemDatasetClass GADatasetDatasetClass parent_class; }; +GARROW_AVAILABLE_IN_6_0 +gboolean +gadataset_file_system_dataset_write_scanner( + GADatasetScanner *scanner, + GADatasetFileSystemDatasetWriteOptions *options, + GError **error); + G_END_DECLS diff --git a/c_glib/arrow-dataset-glib/dataset.hpp b/c_glib/arrow-dataset-glib/dataset.hpp index 94dddd2eb7a..1dab391e8af 100644 --- a/c_glib/arrow-dataset-glib/dataset.hpp +++ b/c_glib/arrow-dataset-glib/dataset.hpp @@ -23,6 +23,7 @@ #include + GADatasetDataset * gadataset_dataset_new_raw( std::shared_ptr *arrow_dataset); @@ -39,10 +40,7 @@ gadataset_dataset_new_raw_valist( std::shared_ptr gadataset_dataset_get_raw(GADatasetDataset *dataset); -GADatasetFileFormat * -gadataset_file_format_new_raw( - std::shared_ptr *arrow_format); -std::shared_ptr -gadataset_dataset_get_raw(GADatasetDataset *dataset); - +arrow::dataset::FileSystemDatasetWriteOptions * +gadataset_file_system_dataset_write_options_get_raw( + GADatasetFileSystemDatasetWriteOptions *options); diff --git a/c_glib/arrow-dataset-glib/enums.c.template b/c_glib/arrow-dataset-glib/enums.c.template new file mode 100644 index 00000000000..8921ab06252 --- /dev/null +++ b/c_glib/arrow-dataset-glib/enums.c.template @@ -0,0 +1,52 @@ +/*** BEGIN file-header ***/ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license 
agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +#include +/*** END file-header ***/ + +/*** BEGIN file-production ***/ + +/* enumerations from "@filename@" */ +/*** END file-production ***/ + +/*** BEGIN value-header ***/ +GType +@enum_name@_get_type(void) +{ + static GType etype = 0; + if (G_UNLIKELY(etype == 0)) { + static const G@Type@Value values[] = { +/*** END value-header ***/ + +/*** BEGIN value-production ***/ + {@VALUENAME@, "@VALUENAME@", "@valuenick@"}, +/*** END value-production ***/ + +/*** BEGIN value-tail ***/ + {0, NULL, NULL} + }; + etype = g_@type@_register_static(g_intern_static_string("@EnumName@"), values); + } + return etype; +} +/*** END value-tail ***/ + +/*** BEGIN file-tail ***/ +/*** END file-tail ***/ diff --git a/c_glib/arrow-dataset-glib/enums.h.template b/c_glib/arrow-dataset-glib/enums.h.template new file mode 100644 index 00000000000..d6a0a455f5a --- /dev/null +++ b/c_glib/arrow-dataset-glib/enums.h.template @@ -0,0 +1,41 @@ +/*** BEGIN file-header ***/ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +#pragma once + +#include + +G_BEGIN_DECLS +/*** END file-header ***/ + +/*** BEGIN file-production ***/ + +/* enumerations from "@filename@" */ +/*** END file-production ***/ + +/*** BEGIN value-header ***/ +GType @enum_name@_get_type(void) G_GNUC_CONST; +#define @ENUMPREFIX@_TYPE_@ENUMSHORT@ (@enum_name@_get_type()) +/*** END value-header ***/ + +/*** BEGIN file-tail ***/ + +G_END_DECLS +/*** END file-tail ***/ diff --git a/c_glib/arrow-dataset-glib/file-format.cpp b/c_glib/arrow-dataset-glib/file-format.cpp index 43f6a198f23..c0c92d966f8 100644 --- a/c_glib/arrow-dataset-glib/file-format.cpp +++ b/c_glib/arrow-dataset-glib/file-format.cpp @@ -18,6 +18,11 @@ */ #include +#include +#include +#include +#include +#include #include @@ -29,6 +34,11 @@ G_BEGIN_DECLS * @title: File format classes * @include: arrow-dataset-glib/arrow-dataset-glib.h * + * #GADatasetFileWriteOptions is a class for options to write a file + * of this format. + * + * #GADatasetFileWriter is a class for writing a file of this format. 
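For reviewers unfamiliar with glib-mkenums: once meson.build (further down) runs the two templates above over the installed headers, each registered enum gains a GType function. For the GADatasetSegmentEncoding enum introduced later in this diff, the expansion looks roughly like the following (a sketch; names follow from the identifier_prefix and symbol_prefix settings, and exact whitespace may differ):

```c
GType
gadataset_segment_encoding_get_type(void)
{
  static GType etype = 0;
  if (G_UNLIKELY(etype == 0)) {
    static const GEnumValue values[] = {
      {GADATASET_SEGMENT_ENCODING_NONE,
       "GADATASET_SEGMENT_ENCODING_NONE", "none"},
      {GADATASET_SEGMENT_ENCODING_URI,
       "GADATASET_SEGMENT_ENCODING_URI", "uri"},
      {0, NULL, NULL}
    };
    etype = g_enum_register_static(
      g_intern_static_string("GADatasetSegmentEncoding"), values);
  }
  return etype;
}
```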
+ * * #GADatasetFileFormat is a base class for file format classes. * * #GADatasetCSVFileFormat is a class for CSV file format. @@ -40,12 +50,218 @@ G_BEGIN_DECLS * Since: 3.0.0 */ +typedef struct GADatasetFileWriteOptionsPrivate_ { + std::shared_ptr options; +} GADatasetFileWriteOptionsPrivate; + +enum { + PROP_OPTIONS = 1, +}; + +G_DEFINE_TYPE_WITH_PRIVATE(GADatasetFileWriteOptions, + gadataset_file_write_options, + G_TYPE_OBJECT) + +#define GADATASET_FILE_WRITE_OPTIONS_GET_PRIVATE(obj) \ + static_cast( \ + gadataset_file_write_options_get_instance_private( \ + GADATASET_FILE_WRITE_OPTIONS(obj))) + +static void +gadataset_file_write_options_finalize(GObject *object) +{ + auto priv = GADATASET_FILE_WRITE_OPTIONS_GET_PRIVATE(object); + priv->options.~shared_ptr(); + G_OBJECT_CLASS(gadataset_file_write_options_parent_class)->finalize(object); +} + +static void +gadataset_file_write_options_set_property(GObject *object, + guint prop_id, + const GValue *value, + GParamSpec *pspec) +{ + auto priv = GADATASET_FILE_WRITE_OPTIONS_GET_PRIVATE(object); + + switch (prop_id) { + case PROP_OPTIONS: + priv->options = + *static_cast *>( + g_value_get_pointer(value)); + break; + default: + G_OBJECT_WARN_INVALID_PROPERTY_ID(object, prop_id, pspec); + break; + } +} + +static void +gadataset_file_write_options_init(GADatasetFileWriteOptions *object) +{ + auto priv = GADATASET_FILE_WRITE_OPTIONS_GET_PRIVATE(object); + new(&priv->options) std::shared_ptr; +} + +static void +gadataset_file_write_options_class_init(GADatasetFileWriteOptionsClass *klass) +{ + auto gobject_class = G_OBJECT_CLASS(klass); + + gobject_class->finalize = gadataset_file_write_options_finalize; + gobject_class->set_property = gadataset_file_write_options_set_property; + + GParamSpec *spec; + spec = g_param_spec_pointer("options", + "Options", + "The raw " + "std::shared *", + static_cast(G_PARAM_WRITABLE | + G_PARAM_CONSTRUCT_ONLY)); + g_object_class_install_property(gobject_class, PROP_OPTIONS, spec); +} + + +typedef struct GADatasetFileWriterPrivate_ { + std::shared_ptr writer; +} GADatasetFileWriterPrivate; + +enum { + PROP_WRITER = 1, +}; + +G_DEFINE_TYPE_WITH_PRIVATE(GADatasetFileWriter, + gadataset_file_writer, + G_TYPE_OBJECT) + +#define GADATASET_FILE_WRITER_GET_PRIVATE(obj) \ + static_cast( \ + gadataset_file_writer_get_instance_private( \ + GADATASET_FILE_WRITER(obj))) + +static void +gadataset_file_writer_finalize(GObject *object) +{ + auto priv = GADATASET_FILE_WRITER_GET_PRIVATE(object); + priv->writer.~shared_ptr(); + G_OBJECT_CLASS(gadataset_file_writer_parent_class)->finalize(object); +} + +static void +gadataset_file_writer_set_property(GObject *object, + guint prop_id, + const GValue *value, + GParamSpec *pspec) +{ + auto priv = GADATASET_FILE_WRITER_GET_PRIVATE(object); + + switch (prop_id) { + case PROP_WRITER: + priv->writer = + *static_cast *>( + g_value_get_pointer(value)); + break; + default: + G_OBJECT_WARN_INVALID_PROPERTY_ID(object, prop_id, pspec); + break; + } +} + +static void +gadataset_file_writer_init(GADatasetFileWriter *object) +{ + auto priv = GADATASET_FILE_WRITER_GET_PRIVATE(object); + new(&(priv->writer)) std::shared_ptr; +} + +static void +gadataset_file_writer_class_init(GADatasetFileWriterClass *klass) +{ + auto gobject_class = G_OBJECT_CLASS(klass); + + gobject_class->finalize = gadataset_file_writer_finalize; + gobject_class->set_property = gadataset_file_writer_set_property; + + GParamSpec *spec; + spec = g_param_spec_pointer("writer", + "Writer", + "The raw " + "std::shared *", + 
static_cast(G_PARAM_WRITABLE | + G_PARAM_CONSTRUCT_ONLY)); + g_object_class_install_property(gobject_class, PROP_WRITER, spec); +} + +/** + * gadataset_file_writer_write_record_batch: + * @writer: A #GADatasetFileWriter. + * @record_batch: A #GArrowRecordBatch to be written. + * @error: (nullable): Return location for a #GError or %NULL. + * + * Returns: %TRUE on success, %FALSE on error. + * + * Since: 6.0.0 + */ +gboolean +gadataset_file_writer_write_record_batch(GADatasetFileWriter *writer, + GArrowRecordBatch *record_batch, + GError **error) +{ + const auto arrow_writer = gadataset_file_writer_get_raw(writer); + const auto arrow_record_batch = garrow_record_batch_get_raw(record_batch); + auto status = arrow_writer->Write(arrow_record_batch); + return garrow::check(error, status, "[file-writer][write-record-batch]"); +} + +/** + * gadataset_file_writer_write_record_batch_reader: + * @writer: A #GADatasetFileWriter. + * @reader: A #GArrowRecordBatchReader to be written. + * @error: (nullable): Return location for a #GError or %NULL. + * + * Returns: %TRUE on success, %FALSE on error. + * + * Since: 6.0.0 + */ +gboolean +gadataset_file_writer_write_record_batch_reader(GADatasetFileWriter *writer, + GArrowRecordBatchReader *reader, + GError **error) +{ + const auto arrow_writer = gadataset_file_writer_get_raw(writer); + auto arrow_reader = garrow_record_batch_reader_get_raw(reader); + auto status = arrow_writer->Write(arrow_reader.get()); + return garrow::check(error, + status, + "[file-writer][write-record-batch-reader]"); +} + +/** + * gadataset_file_writer_finish: + * @writer: A #GADatasetFileWriter. + * @error: (nullable): Return location for a #GError or %NULL. + * + * Returns: %TRUE on success, %FALSE on error. + * + * Since: 6.0.0 + */ +gboolean +gadataset_file_writer_finish(GADatasetFileWriter *writer, + GError **error) +{ + const auto arrow_writer = gadataset_file_writer_get_raw(writer); + auto status = arrow_writer->Finish(); + return garrow::check(error, + status, + "[file-writer][finish]"); +} + + typedef struct GADatasetFileFormatPrivate_ { - std::shared_ptr file_format; + std::shared_ptr format; } GADatasetFileFormatPrivate; enum { - PROP_FILE_FORMAT = 1, + PROP_FORMAT = 1, }; G_DEFINE_TYPE_WITH_PRIVATE(GADatasetFileFormat, @@ -61,9 +277,7 @@ static void gadataset_file_format_finalize(GObject *object) { auto priv = GADATASET_FILE_FORMAT_GET_PRIVATE(object); - - priv->file_format.~shared_ptr(); - + priv->format.~shared_ptr(); G_OBJECT_CLASS(gadataset_file_format_parent_class)->finalize(object); } @@ -76,8 +290,8 @@ gadataset_file_format_set_property(GObject *object, auto priv = GADATASET_FILE_FORMAT_GET_PRIVATE(object); switch (prop_id) { - case PROP_FILE_FORMAT: - priv->file_format = + case PROP_FORMAT: + priv->format = *static_cast *>( g_value_get_pointer(value)); break; @@ -91,7 +305,7 @@ static void gadataset_file_format_init(GADatasetFileFormat *object) { auto priv = GADATASET_FILE_FORMAT_GET_PRIVATE(object); - new(&priv->file_format) std::shared_ptr; + new(&priv->format) std::shared_ptr; } static void @@ -103,49 +317,106 @@ gadataset_file_format_class_init(GADatasetFileFormatClass *klass) gobject_class->set_property = gadataset_file_format_set_property; GParamSpec *spec; - spec = g_param_spec_pointer("file-format", - "FileFormat", + spec = g_param_spec_pointer("format", + "Format", "The raw std::shared *", static_cast(G_PARAM_WRITABLE | G_PARAM_CONSTRUCT_ONLY)); - g_object_class_install_property(gobject_class, PROP_FILE_FORMAT, spec); + 
g_object_class_install_property(gobject_class, PROP_FORMAT, spec); } /** * gadataset_file_format_get_type_name: - * @file_format: A #GADatasetFileFormat. + * @format: A #GADatasetFileFormat. * - * Returns: The type name of @file_format. + * Returns: The type name of @format. * * It should be freed with g_free() when no longer needed. * * Since: 3.0.0 */ gchar * -gadataset_file_format_get_type_name(GADatasetFileFormat *file_format) +gadataset_file_format_get_type_name(GADatasetFileFormat *format) { - const auto arrow_file_format = gadataset_file_format_get_raw(file_format); - const auto &type_name = arrow_file_format->type_name(); + const auto arrow_format = gadataset_file_format_get_raw(format); + const auto &type_name = arrow_format->type_name(); return g_strndup(type_name.data(), type_name.size()); } +/** + * gadataset_file_format_get_default_write_options: + * @format: A #GADatasetFileFormat. + * + * Returns: (transfer full): The default #GADatasetFileWriteOptions of @format. + * + * Since: 6.0.0 + */ +GADatasetFileWriteOptions * +gadataset_file_format_get_default_write_options(GADatasetFileFormat *format) +{ + const auto arrow_format = gadataset_file_format_get_raw(format); + auto arrow_options = arrow_format->DefaultWriteOptions(); + return gadataset_file_write_options_new_raw(&arrow_options); +} + +/** + * gadataset_file_format_open_writer: + * @format: A #GADatasetFileFormat. + * @destination: A #GArrowOutputStream. + * @file_system: The #GArrowFileSystem of @destination. + * @path: The path of @destination. + * @schema: A #GArrowSchema that is used by written record batches. + * @options: A #GADatasetFileWriteOptions. + * @error: (nullable): Return location for a #GError or %NULL. + * + * Returns: (transfer full): The newly created #GADatasetFileWriter of @format + * on success, %NULL on error. + * + * Since: 6.0.0 + */ +GADatasetFileWriter * +gadataset_file_format_open_writer(GADatasetFileFormat *format, + GArrowOutputStream *destination, + GArrowFileSystem *file_system, + const gchar *path, + GArrowSchema *schema, + GADatasetFileWriteOptions *options, + GError **error) +{ + const auto arrow_format = gadataset_file_format_get_raw(format); + auto arrow_destination = garrow_output_stream_get_raw(destination); + auto arrow_file_system = garrow_file_system_get_raw(file_system); + auto arrow_schema = garrow_schema_get_raw(schema); + auto arrow_options = gadataset_file_write_options_get_raw(options); + auto arrow_writer_result = + arrow_format->MakeWriter(arrow_destination, + arrow_schema, + arrow_options, + {arrow_file_system, path}); + if (garrow::check(error, arrow_writer_result, "[file-format][open-writer]")) { + auto arrow_writer = *arrow_writer_result; + return gadataset_file_writer_new_raw(&arrow_writer); + } else { + return NULL; + } +} + /** * gadataset_file_format_equal: - * @file_format: A #GADatasetFileFormat. - * @other_file_format: A #GADatasetFileFormat to be compared. + * @format: A #GADatasetFileFormat. + * @other_format: A #GADatasetFileFormat to be compared. * * Returns: %TRUE if they are the same content file format, %FALSE otherwise. 
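Taken together, the writer entry points added above compose into a simple write path: fetch the format's default options, open a writer, write, finish. A minimal sketch, assuming the destination stream, file system, schema, and record batch already exist; the path is illustrative:

```c
#include <arrow-dataset-glib/arrow-dataset-glib.h>

/* Sketch: write a single record batch with the new FileWriter API. */
static gboolean
write_one_batch(GADatasetFileFormat *format,
                GArrowOutputStream *destination,
                GArrowFileSystem *file_system,
                GArrowSchema *schema,
                GArrowRecordBatch *record_batch,
                GError **error)
{
  GADatasetFileWriteOptions *options =
    gadataset_file_format_get_default_write_options(format);
  GADatasetFileWriter *writer =
    gadataset_file_format_open_writer(format,
                                      destination,
                                      file_system,
                                      "data/part-0.parquet",
                                      schema,
                                      options,
                                      error);
  g_object_unref(options);
  if (!writer) {
    return FALSE;
  }
  gboolean success =
    gadataset_file_writer_write_record_batch(writer, record_batch, error) &&
    gadataset_file_writer_finish(writer, error);
  g_object_unref(writer);
  return success;
}
```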
* * Since: 3.0.0 */ gboolean -gadataset_file_format_equal(GADatasetFileFormat *file_format, - GADatasetFileFormat *other_file_format) +gadataset_file_format_equal(GADatasetFileFormat *format, + GADatasetFileFormat *other_format) { - const auto arrow_file_format = gadataset_file_format_get_raw(file_format); - const auto arrow_other_file_format = - gadataset_file_format_get_raw(other_file_format); - return arrow_file_format->Equals(*arrow_other_file_format); + const auto arrow_format = gadataset_file_format_get_raw(format); + const auto arrow_other_format = gadataset_file_format_get_raw(other_format); + return arrow_format->Equals(*arrow_other_format); } @@ -173,10 +444,9 @@ gadataset_csv_file_format_class_init(GADatasetCSVFileFormatClass *klass) GADatasetCSVFileFormat * gadataset_csv_file_format_new(void) { - std::shared_ptr arrow_file_format = + std::shared_ptr arrow_format = std::make_shared(); - return GADATASET_CSV_FILE_FORMAT( - gadataset_file_format_new_raw(&arrow_file_format)); + return GADATASET_CSV_FILE_FORMAT(gadataset_file_format_new_raw(&arrow_format)); } @@ -204,10 +474,9 @@ gadataset_ipc_file_format_class_init(GADatasetIPCFileFormatClass *klass) GADatasetIPCFileFormat * gadataset_ipc_file_format_new(void) { - std::shared_ptr arrow_file_format = + std::shared_ptr arrow_format = std::make_shared(); - return GADATASET_IPC_FILE_FORMAT( - gadataset_file_format_new_raw(&arrow_file_format)); + return GADATASET_IPC_FILE_FORMAT(gadataset_file_format_new_raw(&arrow_format)); } @@ -235,21 +504,56 @@ gadataset_parquet_file_format_class_init(GADatasetParquetFileFormatClass *klass) GADatasetParquetFileFormat * gadataset_parquet_file_format_new(void) { - std::shared_ptr arrow_file_format = + std::shared_ptr arrow_format = std::make_shared(); return GADATASET_PARQUET_FILE_FORMAT( - gadataset_file_format_new_raw(&arrow_file_format)); + gadataset_file_format_new_raw(&arrow_format)); } G_END_DECLS +GADatasetFileWriteOptions * +gadataset_file_write_options_new_raw( + std::shared_ptr *arrow_options) +{ + return GADATASET_FILE_WRITE_OPTIONS( + g_object_new(GADATASET_TYPE_FILE_WRITE_OPTIONS, + "options", arrow_options, + NULL)); +} + +std::shared_ptr +gadataset_file_write_options_get_raw(GADatasetFileWriteOptions *options) +{ + auto priv = GADATASET_FILE_WRITE_OPTIONS_GET_PRIVATE(options); + return priv->options; +} + + +GADatasetFileWriter * +gadataset_file_writer_new_raw( + std::shared_ptr *arrow_writer) +{ + return GADATASET_FILE_WRITER(g_object_new(GADATASET_TYPE_FILE_WRITER, + "writer", arrow_writer, + NULL)); +} + +std::shared_ptr +gadataset_file_writer_get_raw(GADatasetFileWriter *writer) +{ + auto priv = GADATASET_FILE_WRITER_GET_PRIVATE(writer); + return priv->writer; +} + + GADatasetFileFormat * gadataset_file_format_new_raw( - std::shared_ptr *arrow_file_format) + std::shared_ptr *arrow_format) { GType type = GADATASET_TYPE_FILE_FORMAT; - const auto &type_name = (*arrow_file_format)->type_name(); + const auto &type_name = (*arrow_format)->type_name(); if (type_name == "csv") { type = GADATASET_TYPE_CSV_FILE_FORMAT; } else if (type_name == "ipc") { @@ -258,13 +562,13 @@ gadataset_file_format_new_raw( type = GADATASET_TYPE_PARQUET_FILE_FORMAT; } return GADATASET_FILE_FORMAT(g_object_new(type, - "file-format", arrow_file_format, + "format", arrow_format, NULL)); } std::shared_ptr -gadataset_file_format_get_raw(GADatasetFileFormat *file_format) +gadataset_file_format_get_raw(GADatasetFileFormat *format) { - auto priv = GADATASET_FILE_FORMAT_GET_PRIVATE(file_format); - return 
priv->file_format; + auto priv = GADATASET_FILE_FORMAT_GET_PRIVATE(format); + return priv->format; } diff --git a/c_glib/arrow-dataset-glib/file-format.h b/c_glib/arrow-dataset-glib/file-format.h index 7a6f46f56e9..16a8340747c 100644 --- a/c_glib/arrow-dataset-glib/file-format.h +++ b/c_glib/arrow-dataset-glib/file-format.h @@ -23,6 +23,47 @@ G_BEGIN_DECLS +#define GADATASET_TYPE_FILE_WRITE_OPTIONS \ + (gadataset_file_write_options_get_type()) +G_DECLARE_DERIVABLE_TYPE(GADatasetFileWriteOptions, + gadataset_file_write_options, + GADATASET, + FILE_WRITE_OPTIONS, + GObject) +struct _GADatasetFileWriteOptionsClass +{ + GObjectClass parent_class; +}; + + +#define GADATASET_TYPE_FILE_WRITER \ + (gadataset_file_writer_get_type()) +G_DECLARE_DERIVABLE_TYPE(GADatasetFileWriter, + gadataset_file_writer, + GADATASET, + FILE_WRITER, + GObject) +struct _GADatasetFileWriterClass +{ + GObjectClass parent_class; +}; + +GARROW_AVAILABLE_IN_6_0 +gboolean +gadataset_file_writer_write_record_batch(GADatasetFileWriter *writer, + GArrowRecordBatch *record_batch, + GError **error); +GARROW_AVAILABLE_IN_6_0 +gboolean +gadataset_file_writer_write_record_batch_reader(GADatasetFileWriter *writer, + GArrowRecordBatchReader *reader, + GError **error); +GARROW_AVAILABLE_IN_6_0 +gboolean +gadataset_file_writer_finish(GADatasetFileWriter *writer, + GError **error); + + #define GADATASET_TYPE_FILE_FORMAT (gadataset_file_format_get_type()) G_DECLARE_DERIVABLE_TYPE(GADatasetFileFormat, gadataset_file_format, @@ -36,12 +77,24 @@ struct _GADatasetFileFormatClass GARROW_AVAILABLE_IN_3_0 gchar * -gadataset_file_format_get_type_name(GADatasetFileFormat *file_format); +gadataset_file_format_get_type_name(GADatasetFileFormat *format); +GARROW_AVAILABLE_IN_6_0 +GADatasetFileWriteOptions * +gadataset_file_format_get_default_write_options(GADatasetFileFormat *format); +GARROW_AVAILABLE_IN_6_0 +GADatasetFileWriter * +gadataset_file_format_open_writer(GADatasetFileFormat *format, + GArrowOutputStream *destination, + GArrowFileSystem *file_system, + const gchar *path, + GArrowSchema *schema, + GADatasetFileWriteOptions *options, + GError **error); GARROW_AVAILABLE_IN_3_0 gboolean -gadataset_file_format_equal(GADatasetFileFormat *file_format, - GADatasetFileFormat *other_file_format); +gadataset_file_format_equal(GADatasetFileFormat *format, + GADatasetFileFormat *other_format); #define GADATASET_TYPE_CSV_FILE_FORMAT (gadataset_csv_file_format_get_type()) diff --git a/c_glib/arrow-dataset-glib/file-format.hpp b/c_glib/arrow-dataset-glib/file-format.hpp index 5dfb20b3caa..636dc5c015b 100644 --- a/c_glib/arrow-dataset-glib/file-format.hpp +++ b/c_glib/arrow-dataset-glib/file-format.hpp @@ -23,8 +23,22 @@ #include +GADatasetFileWriteOptions * +gadataset_file_write_options_new_raw( + std::shared_ptr *arrow_options); +std::shared_ptr +gadataset_file_write_options_get_raw(GADatasetFileWriteOptions *options); + + +GADatasetFileWriter * +gadataset_file_writer_new_raw( + std::shared_ptr *arrow_writer); +std::shared_ptr +gadataset_file_writer_get_raw(GADatasetFileWriter *writer); + + GADatasetFileFormat * gadataset_file_format_new_raw( - std::shared_ptr *arrow_file_format); + std::shared_ptr *arrow_format); std::shared_ptr -gadataset_file_format_get_raw(GADatasetFileFormat *file_format); +gadataset_file_format_get_raw(GADatasetFileFormat *format); diff --git a/c_glib/arrow-dataset-glib/meson.build b/c_glib/arrow-dataset-glib/meson.build index b3f617330cf..0d9b8564ecb 100644 --- a/c_glib/arrow-dataset-glib/meson.build +++ 
b/c_glib/arrow-dataset-glib/meson.build @@ -22,6 +22,7 @@ sources = files( 'dataset.cpp', 'file-format.cpp', 'fragment.cpp', + 'partitioning.cpp', 'scanner.cpp', ) @@ -31,6 +32,7 @@ c_headers = files( 'dataset.h', 'file-format.h', 'fragment.h', + 'partitioning.h', 'scanner.h', ) @@ -40,9 +42,22 @@ cpp_headers = files( 'dataset.hpp', 'file-format.hpp', 'fragment.hpp', + 'partitioning.hpp', 'scanner.hpp', ) +enums = gnome.mkenums('enums', + sources: c_headers, + identifier_prefix: 'GADataset', + symbol_prefix: 'gadataset', + c_template: 'enums.c.template', + h_template: 'enums.h.template', + install_dir: join_paths(include_dir, meson.project_name()), + install_header: true) +enums_source = enums[0] +enums_header = enums[1] + + headers = c_headers + cpp_headers install_headers(headers, subdir: 'arrow-dataset-glib') @@ -51,7 +66,7 @@ dependencies = [ arrow_glib, ] libarrow_dataset_glib = library('arrow-dataset-glib', - sources: sources, + sources: sources + enums, install: true, dependencies: dependencies, include_directories: base_include_directories, @@ -59,7 +74,8 @@ libarrow_dataset_glib = library('arrow-dataset-glib', version: library_version) arrow_dataset_glib = declare_dependency(link_with: libarrow_dataset_glib, include_directories: base_include_directories, - dependencies: dependencies) + dependencies: dependencies, + sources: enums_header) pkgconfig.generate(libarrow_dataset_glib, filebase: 'arrow-dataset-glib', @@ -71,7 +87,7 @@ pkgconfig.generate(libarrow_dataset_glib, if have_gi gnome.generate_gir(libarrow_dataset_glib, dependencies: declare_dependency(sources: arrow_glib_gir), - sources: sources + c_headers, + sources: sources + c_headers + enums, namespace: 'ArrowDataset', nsversion: api_version, identifier_prefix: 'GADataset', diff --git a/c_glib/arrow-dataset-glib/partitioning.cpp b/c_glib/arrow-dataset-glib/partitioning.cpp new file mode 100644 index 00000000000..bce33671a35 --- /dev/null +++ b/c_glib/arrow-dataset-glib/partitioning.cpp @@ -0,0 +1,440 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ + +#include +#include +#include + +#include +#include + +G_BEGIN_DECLS + +/** + * SECTION: partitioning + * @section_id: partitioning + * @title: Partitioning classes + * @include: arrow-dataset-glib/arrow-dataset-glib.h + * + * #GADatasetPartitioningOptions is a class for partitioning options. + * + * #GADatasetPartitioning is a base class for partitioning classes + * such as #GADatasetDirectoryPartitioning. + * + * #GADatasetKeyValuePartitioning is a base class for key-value style + * partitioning classes such as #GADatasetDirectoryPartitioning. + * + * #GADatasetDirectoryPartitioning is a class for partitioning that + * uses directory structure. 
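To make the class hierarchy concrete: with a schema of `year: int16, month: int8`, a #GADatasetDirectoryPartitioning maps the path segments `/2009/11` to the equivalent of `year == 2009 and month == 11`. A sketch of building one with the constructor added below, using existing arrow-glib schema helpers:

```c
#include <arrow-dataset-glib/arrow-dataset-glib.h>

/* Sketch: directory partitioning over year/month path segments. */
static GADatasetDirectoryPartitioning *
make_year_month_partitioning(GError **error)
{
  GList *fields = NULL;
  fields = g_list_append(fields,
                         garrow_field_new("year",
                                          garrow_int16_data_type_new()));
  fields = g_list_append(fields,
                         garrow_field_new("month",
                                          garrow_int8_data_type_new()));
  GArrowSchema *schema = garrow_schema_new(fields);
  g_list_free_full(fields, g_object_unref);
  GADatasetDirectoryPartitioning *partitioning =
    gadataset_directory_partitioning_new(schema, NULL, NULL, error);
  g_object_unref(schema);
  return partitioning;
}
```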
+ * + * Since: 6.0.0 + */ + +typedef struct GADatasetPartitioningOptionsPrivate_ { + gboolean infer_dictionary; + GArrowSchema *schema; + GADatasetSegmentEncoding segment_encoding; +} GADatasetPartitioningOptionsPrivate; + +enum { + PROP_INFER_DICTIONARY = 1, + PROP_SCHEMA, + PROP_SEGMENT_ENCODING, +}; + +G_DEFINE_TYPE_WITH_PRIVATE(GADatasetPartitioningOptions, + gadataset_partitioning_options, + G_TYPE_OBJECT) + +#define GADATASET_PARTITIONING_OPTIONS_GET_PRIVATE(obj) \ + static_cast( \ + gadataset_partitioning_options_get_instance_private( \ + GADATASET_PARTITIONING_OPTIONS(obj))) + +static void +gadataset_partitioning_options_dispose(GObject *object) +{ + auto priv = GADATASET_PARTITIONING_OPTIONS_GET_PRIVATE(object); + + if (priv->schema) { + g_object_unref(priv->schema); + priv->schema = nullptr; + } + + G_OBJECT_CLASS(gadataset_partitioning_options_parent_class)->dispose(object); +} + +static void +gadataset_partitioning_options_set_property(GObject *object, + guint prop_id, + const GValue *value, + GParamSpec *pspec) +{ + auto priv = GADATASET_PARTITIONING_OPTIONS_GET_PRIVATE(object); + + switch (prop_id) { + case PROP_INFER_DICTIONARY: + priv->infer_dictionary = g_value_get_boolean(value); + break; + case PROP_SCHEMA: + { + auto schema = g_value_get_object(value); + if (priv->schema == schema) { + break; + } + auto old_schema = priv->schema; + if (schema) { + g_object_ref(schema); + priv->schema = GARROW_SCHEMA(schema); + } else { + priv->schema = NULL; + } + if (old_schema) { + g_object_unref(old_schema); + } + } + break; + case PROP_SEGMENT_ENCODING: + priv->segment_encoding = + static_cast(g_value_get_enum(value)); + break; + default: + G_OBJECT_WARN_INVALID_PROPERTY_ID(object, prop_id, pspec); + break; + } +} + +static void +gadataset_partitioning_options_get_property(GObject *object, + guint prop_id, + GValue *value, + GParamSpec *pspec) +{ + auto priv = GADATASET_PARTITIONING_OPTIONS_GET_PRIVATE(object); + + switch (prop_id) { + case PROP_INFER_DICTIONARY: + g_value_set_boolean(value, priv->infer_dictionary); + break; + case PROP_SCHEMA: + g_value_set_object(value, priv->schema); + break; + case PROP_SEGMENT_ENCODING: + g_value_set_enum(value, priv->segment_encoding); + break; + default: + G_OBJECT_WARN_INVALID_PROPERTY_ID(object, prop_id, pspec); + break; + } +} + +static void +gadataset_partitioning_options_init(GADatasetPartitioningOptions *object) +{ +} + +static void +gadataset_partitioning_options_class_init( + GADatasetPartitioningOptionsClass *klass) +{ + auto gobject_class = G_OBJECT_CLASS(klass); + + gobject_class->dispose = gadataset_partitioning_options_dispose; + gobject_class->set_property = gadataset_partitioning_options_set_property; + gobject_class->get_property = gadataset_partitioning_options_get_property; + + arrow::dataset::PartitioningFactoryOptions default_options; + GParamSpec *spec; + /** + * GADatasetPartitioningOptions:infer-dictionary: + * + * When inferring a schema for partition fields, yield dictionary + * encoded types instead of plain. This can be more efficient when + * materializing virtual columns, and Expressions parsed by the + * finished Partitioning will include dictionaries of all unique + * inspected values for each field. 
+ *
+ * Since: 6.0.0
+ */
+  spec = g_param_spec_boolean("infer-dictionary",
+                              "Infer dictionary",
+                              "Whether to encode partitioned field values as "
+                              "dictionaries",
+                              default_options.infer_dictionary,
+                              static_cast<GParamFlags>(G_PARAM_READWRITE));
+  g_object_class_install_property(gobject_class, PROP_INFER_DICTIONARY, spec);
+
+  /**
+   * GADatasetPartitioningOptions:schema:
+   *
+   * Optionally, an expected schema can be provided, in which case
+   * inference will only check discovered fields against the schema
+   * and update internal state (such as dictionaries).
+   *
+   * Since: 6.0.0
+   */
+  spec = g_param_spec_object("schema",
+                             "Schema",
+                             "Inference will only check discovered fields "
+                             "against the schema and update internal state",
+                             GARROW_TYPE_SCHEMA,
+                             static_cast<GParamFlags>(G_PARAM_READWRITE));
+  g_object_class_install_property(gobject_class, PROP_SCHEMA, spec);
+
+  /**
+   * GADatasetPartitioningOptions:segment-encoding:
+   *
+   * After splitting a path into components, decode the path
+   * components before parsing according to this scheme.
+   *
+   * Since: 6.0.0
+   */
+  spec = g_param_spec_enum("segment-encoding",
+                           "Segment encoding",
+                           "After splitting a path into components, "
+                           "decode the path components before "
+                           "parsing according to this scheme",
+                           GADATASET_TYPE_SEGMENT_ENCODING,
+                           static_cast<GADatasetSegmentEncoding>(
+                             default_options.segment_encoding),
+                           static_cast<GParamFlags>(G_PARAM_READWRITE));
+  g_object_class_install_property(gobject_class, PROP_SEGMENT_ENCODING, spec);
+}
+
+/**
+ * gadataset_partitioning_options_new:
+ *
+ * Returns: The newly created #GADatasetPartitioningOptions.
+ *
+ * Since: 6.0.0
+ */
+GADatasetPartitioningOptions *
+gadataset_partitioning_options_new(void)
+{
+  return GADATASET_PARTITIONING_OPTIONS(
+    g_object_new(GADATASET_TYPE_PARTITIONING_OPTIONS,
+                 NULL));
+}
+
+
+typedef struct GADatasetPartitioningPrivate_ {
+  std::shared_ptr<arrow::dataset::Partitioning> partitioning;
+} GADatasetPartitioningPrivate;
+
+enum {
+  PROP_PARTITIONING = 1,
+};
+
+G_DEFINE_TYPE_WITH_PRIVATE(GADatasetPartitioning,
+                           gadataset_partitioning,
+                           G_TYPE_OBJECT)
+
+#define GADATASET_PARTITIONING_GET_PRIVATE(obj)        \
+  static_cast<GADatasetPartitioningPrivate *>(         \
+    gadataset_partitioning_get_instance_private(       \
+      GADATASET_PARTITIONING(obj)))
+
+static void
+gadataset_partitioning_finalize(GObject *object)
+{
+  auto priv = GADATASET_PARTITIONING_GET_PRIVATE(object);
+  priv->partitioning.~shared_ptr();
+  G_OBJECT_CLASS(gadataset_partitioning_parent_class)->finalize(object);
+}
+
+static void
+gadataset_partitioning_set_property(GObject *object,
+                                    guint prop_id,
+                                    const GValue *value,
+                                    GParamSpec *pspec)
+{
+  auto priv = GADATASET_PARTITIONING_GET_PRIVATE(object);
+
+  switch (prop_id) {
+  case PROP_PARTITIONING:
+    priv->partitioning =
+      *static_cast<std::shared_ptr<arrow::dataset::Partitioning> *>(
+        g_value_get_pointer(value));
+    break;
+  default:
+    G_OBJECT_WARN_INVALID_PROPERTY_ID(object, prop_id, pspec);
+    break;
+  }
+}
+
+static void
+gadataset_partitioning_init(GADatasetPartitioning *object)
+{
+  auto priv = GADATASET_PARTITIONING_GET_PRIVATE(object);
+  new(&priv->partitioning) std::shared_ptr<arrow::dataset::Partitioning>;
+}
+
+static void
+gadataset_partitioning_class_init(GADatasetPartitioningClass *klass)
+{
+  auto gobject_class = G_OBJECT_CLASS(klass);
+
+  gobject_class->finalize = gadataset_partitioning_finalize;
+  gobject_class->set_property = gadataset_partitioning_set_property;
+
+  GParamSpec *spec;
+  spec = g_param_spec_pointer("partitioning",
+                              "Partitioning",
+                              "The raw "
+                              "std::shared_ptr<arrow::dataset::Partitioning> *",
+                              static_cast<GParamFlags>(G_PARAM_WRITABLE |
+                                                       G_PARAM_CONSTRUCT_ONLY));
+  g_object_class_install_property(gobject_class, PROP_PARTITIONING, spec);
+}
+
+/**
+ *
gadataset_partitioning_new: + * + * Returns: The newly created #GADatasetPartitioning that doesn't + * partition. + * + * Since: 6.0.0 + */ +GADatasetPartitioning * +gadataset_partitioning_new(void) +{ + auto arrow_partitioning = arrow::dataset::Partitioning::Default(); + return GADATASET_PARTITIONING( + g_object_new(GADATASET_TYPE_PARTITIONING, + "partitioning", &arrow_partitioning, + NULL)); +} + +/** + * gadataset_partitioning_get_type_name: + * @partitioning: A #GADatasetPartitioning. + * + * Returns: The type name of @partitioning. + * + * It should be freed with g_free() when no longer needed. + * + * Since: 6.0.0 + */ +gchar * +gadataset_partitioning_get_type_name(GADatasetPartitioning *partitioning) +{ + auto arrow_partitioning = gadataset_partitioning_get_raw(partitioning); + auto arrow_type_name = arrow_partitioning->type_name(); + return g_strndup(arrow_type_name.c_str(), + arrow_type_name.size()); +} + + +G_DEFINE_TYPE(GADatasetKeyValuePartitioning, + gadataset_key_value_partitioning, + GADATASET_TYPE_PARTITIONING) + +static void +gadataset_key_value_partitioning_init(GADatasetKeyValuePartitioning *object) +{ +} + +static void +gadataset_key_value_partitioning_class_init( + GADatasetKeyValuePartitioningClass *klass) +{ +} + + +G_DEFINE_TYPE(GADatasetDirectoryPartitioning, + gadataset_directory_partitioning, + GADATASET_TYPE_KEY_VALUE_PARTITIONING) + +static void +gadataset_directory_partitioning_init(GADatasetDirectoryPartitioning *object) +{ +} + +static void +gadataset_directory_partitioning_class_init( + GADatasetDirectoryPartitioningClass *klass) +{ +} + +/** + * gadataset_directory_partitioning_new: + * @schema: A #GArrowSchema that describes all partitioned segments. + * @dictionaries: (nullable) (element-type GArrowArray): A list of #GArrowArray + * for dictionary data types in @schema. + * @options: (nullable): A #GADatasetPartitioningOptions. + * @error: (nullable): Return location for a #GError or %NULL. + * + * Returns: The newly created #GADatasetDirectoryPartitioning on success, + * %NULL on error. 
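One note on the @options parameter documented above: segment decoding is opt-in through the segment-encoding property. A short sketch, reusing a `schema` built as in the earlier partitioning example:

```c
/* Sketch: decode URL-encoded path segments before parsing. */
GError *error = NULL;
GADatasetPartitioningOptions *options = gadataset_partitioning_options_new();
g_object_set(options,
             "segment-encoding", GADATASET_SEGMENT_ENCODING_URI,
             NULL);
GADatasetDirectoryPartitioning *partitioning =
  gadataset_directory_partitioning_new(schema, NULL, options, &error);
g_object_unref(options);
```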
+ *
+ * Since: 6.0.0
+ */
+GADatasetDirectoryPartitioning *
+gadataset_directory_partitioning_new(GArrowSchema *schema,
+                                     GList *dictionaries,
+                                     GADatasetPartitioningOptions *options,
+                                     GError **error)
+{
+  auto arrow_schema = garrow_schema_get_raw(schema);
+  std::vector<std::shared_ptr<arrow::Array>> arrow_dictionaries;
+  for (auto node = dictionaries; node; node = node->next) {
+    auto dictionary = GARROW_ARRAY(node->data);
+    if (dictionary) {
+      arrow_dictionaries.push_back(garrow_array_get_raw(dictionary));
+    } else {
+      arrow_dictionaries.push_back(nullptr);
+    }
+  }
+  arrow::dataset::KeyValuePartitioningOptions arrow_options;
+  if (options) {
+    arrow_options =
+      gadataset_partitioning_options_get_raw_key_value_partitioning_options(
+        options);
+  }
+  auto arrow_partitioning =
+    std::make_shared<arrow::dataset::DirectoryPartitioning>(
+      arrow_schema,
+      arrow_dictionaries,
+      arrow_options);
+  return GADATASET_DIRECTORY_PARTITIONING(
+    g_object_new(GADATASET_TYPE_DIRECTORY_PARTITIONING,
+                 "partitioning", &arrow_partitioning,
+                 NULL));
+}
+
+
+G_END_DECLS
+
+arrow::dataset::KeyValuePartitioningOptions
+gadataset_partitioning_options_get_raw_key_value_partitioning_options(
+  GADatasetPartitioningOptions *options)
+{
+  auto priv = GADATASET_PARTITIONING_OPTIONS_GET_PRIVATE(options);
+  arrow::dataset::KeyValuePartitioningOptions arrow_options;
+  arrow_options.segment_encoding =
+    static_cast<arrow::dataset::SegmentEncoding>(priv->segment_encoding);
+  return arrow_options;
+}
+
+std::shared_ptr<arrow::dataset::Partitioning>
+gadataset_partitioning_get_raw(GADatasetPartitioning *partitioning)
+{
+  auto priv = GADATASET_PARTITIONING_GET_PRIVATE(partitioning);
+  return priv->partitioning;
+}
diff --git a/c_glib/arrow-dataset-glib/partitioning.h b/c_glib/arrow-dataset-glib/partitioning.h
new file mode 100644
index 00000000000..d408d9bd502
--- /dev/null
+++ b/c_glib/arrow-dataset-glib/partitioning.h
@@ -0,0 +1,110 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+
+#pragma once
+
+#include <arrow-glib/arrow-glib.h>
+
+G_BEGIN_DECLS
+
+/**
+ * GADatasetSegmentEncoding:
+ * @GADATASET_SEGMENT_ENCODING_NONE: No encoding.
+ * @GADATASET_SEGMENT_ENCODING_URI: Segment values are URL-encoded.
+ *
+ * They correspond to `arrow::dataset::SegmentEncoding` values.
+ * + * Since: 6.0.0 + */ +typedef enum { + GADATASET_SEGMENT_ENCODING_NONE, + GADATASET_SEGMENT_ENCODING_URI, +} GADatasetSegmentEncoding; + + +#define GADATASET_TYPE_PARTITIONING_OPTIONS \ + (gadataset_partitioning_options_get_type()) +G_DECLARE_DERIVABLE_TYPE(GADatasetPartitioningOptions, + gadataset_partitioning_options, + GADATASET, + PARTITIONING_OPTIONS, + GObject) +struct _GADatasetPartitioningOptionsClass +{ + GObjectClass parent_class; +}; + +GARROW_AVAILABLE_IN_6_0 +GADatasetPartitioningOptions * +gadataset_partitioning_options_new(void); + + +#define GADATASET_TYPE_PARTITIONING (gadataset_partitioning_get_type()) +G_DECLARE_DERIVABLE_TYPE(GADatasetPartitioning, + gadataset_partitioning, + GADATASET, + PARTITIONING, + GObject) +struct _GADatasetPartitioningClass +{ + GObjectClass parent_class; +}; + +GARROW_AVAILABLE_IN_6_0 +GADatasetPartitioning * +gadataset_partitioning_new(void); +GARROW_AVAILABLE_IN_6_0 +gchar * +gadataset_partitioning_get_type_name(GADatasetPartitioning *partitioning); + + +#define GADATASET_TYPE_KEY_VALUE_PARTITIONING \ + (gadataset_key_value_partitioning_get_type()) +G_DECLARE_DERIVABLE_TYPE(GADatasetKeyValuePartitioning, + gadataset_key_value_partitioning, + GADATASET, + KEY_VALUE_PARTITIONING, + GADatasetPartitioning) +struct _GADatasetKeyValuePartitioningClass +{ + GADatasetPartitioningClass parent_class; +}; + + +#define GADATASET_TYPE_DIRECTORY_PARTITIONING \ + (gadataset_directory_partitioning_get_type()) +G_DECLARE_DERIVABLE_TYPE(GADatasetDirectoryPartitioning, + gadataset_directory_partitioning, + GADATASET, + DIRECTORY_PARTITIONING, + GADatasetKeyValuePartitioning) +struct _GADatasetDirectoryPartitioningClass +{ + GADatasetKeyValuePartitioningClass parent_class; +}; + +GARROW_AVAILABLE_IN_6_0 +GADatasetDirectoryPartitioning * +gadataset_directory_partitioning_new(GArrowSchema *schema, + GList *dictionaries, + GADatasetPartitioningOptions *options, + GError **error); + + +G_END_DECLS diff --git a/c_glib/arrow-dataset-glib/partitioning.hpp b/c_glib/arrow-dataset-glib/partitioning.hpp new file mode 100644 index 00000000000..2481ecb3340 --- /dev/null +++ b/c_glib/arrow-dataset-glib/partitioning.hpp @@ -0,0 +1,31 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. 
+ */ + +#pragma once + +#include <arrow/dataset/api.h> + +#include <arrow-dataset-glib/partitioning.h> + +arrow::dataset::KeyValuePartitioningOptions +gadataset_partitioning_options_get_raw_key_value_partitioning_options( + GADatasetPartitioningOptions *options); + +std::shared_ptr<arrow::dataset::Partitioning> +gadataset_partitioning_get_raw(GADatasetPartitioning *partitioning); diff --git a/c_glib/arrow-dataset-glib/scanner.cpp b/c_glib/arrow-dataset-glib/scanner.cpp index efa2a5c3287..ddd3fd88af7 100644 --- a/c_glib/arrow-dataset-glib/scanner.cpp +++ b/c_glib/arrow-dataset-glib/scanner.cpp @@ -18,6 +18,7 @@ */ #include +#include #include #include @@ -225,6 +226,24 @@ gadataset_scanner_builder_new(GADatasetDataset *dataset, GError **error) } } +/** + * gadataset_scanner_builder_new_record_batch_reader: + * @reader: A #GArrowRecordBatchReader that produces record batches. + * + * Returns: (nullable): A newly created #GADatasetScannerBuilder. + * + * Since: 6.0.0 + */ +GADatasetScannerBuilder * +gadataset_scanner_builder_new_record_batch_reader( + GArrowRecordBatchReader *reader) +{ + auto arrow_reader = garrow_record_batch_reader_get_raw(reader); + auto arrow_scanner_builder = + arrow::dataset::ScannerBuilder::FromRecordBatchReader(arrow_reader); + return gadataset_scanner_builder_new_raw(&arrow_scanner_builder); +} + /** * gadataset_scanner_builder_finish: * @builder: A #GADatasetScannerBuilder. diff --git a/c_glib/arrow-dataset-glib/scanner.h b/c_glib/arrow-dataset-glib/scanner.h index 446815d6db1..ba7f9c6b7c3 100644 --- a/c_glib/arrow-dataset-glib/scanner.h +++ b/c_glib/arrow-dataset-glib/scanner.h @@ -55,6 +55,10 @@ GARROW_AVAILABLE_IN_5_0 GADatasetScannerBuilder * gadataset_scanner_builder_new(GADatasetDataset *dataset, GError **error); +GARROW_AVAILABLE_IN_6_0 +GADatasetScannerBuilder * +gadataset_scanner_builder_new_record_batch_reader( + GArrowRecordBatchReader *reader); GARROW_AVAILABLE_IN_5_0 GADatasetScanner * gadataset_scanner_builder_finish(GADatasetScannerBuilder *builder, diff --git a/c_glib/arrow-glib/composite-data-type.cpp b/c_glib/arrow-glib/composite-data-type.cpp index 95cd283c1b3..fadcafe6b40 100644 --- a/c_glib/arrow-glib/composite-data-type.cpp +++ b/c_glib/arrow-glib/composite-data-type.cpp @@ -376,7 +376,7 @@ garrow_map_data_type_new(GArrowDataType *key_type, * garrow_map_data_type_get_key_type: * @map_data_type: A #GArrowMapDataType. * - * Return: (transfer full): The key type of the map. + * Returns: (transfer full): The key type of the map. * * Since: 0.17.0 */ @@ -395,7 +395,7 @@ garrow_map_data_type_get_key_type(GArrowMapDataType *map_data_type) * garrow_map_data_type_get_item_type: * @map_data_type: A #GArrowMapDataType. * - * Return: (transfer full): The item type of the map. + * Returns: (transfer full): The item type of the map. * * Since: 0.17.0 */ diff --git a/c_glib/arrow-glib/compute.cpp b/c_glib/arrow-glib/compute.cpp index 8783510728a..2f4a0de215c 100644 --- a/c_glib/arrow-glib/compute.cpp +++ b/c_glib/arrow-glib/compute.cpp @@ -126,6 +126,8 @@ G_BEGIN_DECLS * #GArrowFunctionOptions is a base class for all function options * classes such as #GArrowCastOptions. * + * #GArrowFunctionDoc is a class for function documentation. + * * #GArrowFunction is a class to process data. * * #GArrowExecuteNodeOptions is a base class for all execute node @@ -165,6 +167,12 @@ G_BEGIN_DECLS * #GArrowSortOptions is a class to customize the `sort_indices` * function. * + * #GArrowSetLookupOptions is a class to customize the `is_in` and + * `index_in` functions.
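The scanner-builder addition above pairs with the existing finish/to_table API; a minimal C sketch, assuming `reader` is a valid #GArrowRecordBatchReader supplied by the caller:

    /* Sketch: scan an in-memory record batch reader via the new
     * 6.0.0 entry point; `reader` is assumed to exist already. */
    GError *error = NULL;
    GADatasetScannerBuilder *builder =
      gadataset_scanner_builder_new_record_batch_reader(reader);
    GADatasetScanner *scanner =
      gadataset_scanner_builder_finish(builder, &error);
    if (scanner) {
      GArrowTable *table = gadataset_scanner_to_table(scanner, &error);
      /* ... use table ... */
    }
    g_object_unref(builder);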
+ * + * #GArrowVarianceOptions is a class to customize the `stddev` and + * `variance` functions. + * * There are many functions to compute data on an array. */ @@ -254,6 +262,145 @@ garrow_function_options_class_init(GArrowFunctionOptionsClass *klass) } + +typedef struct GArrowFunctionDocPrivate_ { + arrow::compute::FunctionDoc *doc; +} GArrowFunctionDocPrivate; + +enum { + PROP_DOC = 1, +}; + +G_DEFINE_TYPE_WITH_PRIVATE(GArrowFunctionDoc, + garrow_function_doc, + G_TYPE_OBJECT) + +#define GARROW_FUNCTION_DOC_GET_PRIVATE(object) \ + static_cast<GArrowFunctionDocPrivate *>( \ + garrow_function_doc_get_instance_private( \ + GARROW_FUNCTION_DOC(object))) + +static void +garrow_function_doc_set_property(GObject *object, + guint prop_id, + const GValue *value, + GParamSpec *pspec) +{ + auto priv = GARROW_FUNCTION_DOC_GET_PRIVATE(object); + + switch (prop_id) { + case PROP_DOC: + priv->doc = + static_cast<arrow::compute::FunctionDoc *>(g_value_get_pointer(value)); + break; + default: + G_OBJECT_WARN_INVALID_PROPERTY_ID(object, prop_id, pspec); + break; + } +} + +static void +garrow_function_doc_init(GArrowFunctionDoc *object) +{ +} + +static void +garrow_function_doc_class_init(GArrowFunctionDocClass *klass) +{ + auto gobject_class = G_OBJECT_CLASS(klass); + gobject_class->set_property = garrow_function_doc_set_property; + + GParamSpec *spec; + spec = g_param_spec_pointer("doc", + "Doc", + "The raw arrow::compute::FunctionDoc *", + static_cast<GParamFlags>(G_PARAM_WRITABLE | + G_PARAM_CONSTRUCT_ONLY)); + g_object_class_install_property(gobject_class, PROP_DOC, spec); +} + +/** + * garrow_function_doc_get_summary: + * @doc: A #GArrowFunctionDoc. + * + * Returns: A one-line summary of the function, using a verb. + * + * It should be freed with g_free() when no longer needed. + * + * Since: 6.0.0 + */ +gchar * +garrow_function_doc_get_summary(GArrowFunctionDoc *doc) +{ + auto arrow_doc = garrow_function_doc_get_raw(doc); + return g_strndup(arrow_doc->summary.data(), + arrow_doc->summary.size()); +} + +/** + * garrow_function_doc_get_description: + * @doc: A #GArrowFunctionDoc. + * + * Returns: A detailed description of the function, meant to follow + * the summary. + * + * It should be freed with g_free() when no longer needed. + * + * Since: 6.0.0 + */ +gchar * +garrow_function_doc_get_description(GArrowFunctionDoc *doc) +{ + auto arrow_doc = garrow_function_doc_get_raw(doc); + return g_strndup(arrow_doc->description.data(), + arrow_doc->description.size()); +} + +/** + * garrow_function_doc_get_arg_names: + * @doc: A #GArrowFunctionDoc. + * + * Returns: (array zero-terminated=1) (element-type utf8) (transfer full): + * Symbolic names (identifiers) for the function arguments. + * + * It's a %NULL-terminated string array. It must be freed with + * g_strfreev() when no longer needed. + * + * Since: 6.0.0 + */ +gchar ** +garrow_function_doc_get_arg_names(GArrowFunctionDoc *doc) +{ + auto arrow_doc = garrow_function_doc_get_raw(doc); + const auto &arrow_arg_names = arrow_doc->arg_names; + auto n = arrow_arg_names.size(); + auto arg_names = g_new(gchar *, n + 1); + for (size_t i = 0; i < n; ++i) { + arg_names[i] = g_strndup(arrow_arg_names[i].data(), + arrow_arg_names[i].size()); + } + arg_names[n] = NULL; + return arg_names; +} + +/** + * garrow_function_doc_get_options_class_name: + * @doc: A #GArrowFunctionDoc. + * + * Returns: Name of the options class, if any. + * + * It should be freed with g_free() when no longer needed.
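Taken together, the getters above make compute functions self-describing from C; a short sketch (the "or" function name mirrors the Ruby test added later in this patch):

    /* Sketch: look up a compute function and print its summary. */
    GArrowFunction *function = garrow_function_find("or");
    GArrowFunctionDoc *doc = garrow_function_get_doc(function);
    gchar *summary = garrow_function_doc_get_summary(doc);
    g_print("or: %s\n", summary);
    g_free(summary);
    g_object_unref(doc);
    g_object_unref(function);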
+ * + * Since: 6.0.0 + */ +gchar * +garrow_function_doc_get_options_class_name(GArrowFunctionDoc *doc) +{ + auto arrow_doc = garrow_function_doc_get_raw(doc); + return g_strndup(arrow_doc->options_class.data(), + arrow_doc->options_class.size()); +} + + typedef struct GArrowFunctionPrivate_ { + std::shared_ptr<arrow::compute::Function> function; +} GArrowFunctionPrivate; @@ -397,6 +544,22 @@ garrow_function_execute(GArrowFunction *function, } } +/** + * garrow_function_get_doc: + * @function: A #GArrowFunction. + * + * Returns: (transfer full): The function documentation. + * + * Since: 6.0.0 + */ +GArrowFunctionDoc * +garrow_function_get_doc(GArrowFunction *function) +{ + auto arrow_function = garrow_function_get_raw(function); + const auto &arrow_doc = arrow_function->doc(); + return garrow_function_doc_new_raw(&arrow_doc); +} + typedef struct GArrowExecuteNodeOptionsPrivate_ { arrow::compute::ExecNodeOptions *options; @@ -1271,7 +1434,7 @@ garrow_execute_plan_build_source_node(GArrowExecutePlan *plan, /** * garrow_execute_plan_build_aggregate_node: * @plan: A #GArrowExecutePlan. - * @input: A #GarrowExecuteNode. + * @input: A #GArrowExecuteNode. * @options: A #GArrowAggregateNodeOptions. * @error: (nullable): Return location for a #GError or %NULL. * @@ -1304,7 +1467,7 @@ garrow_execute_plan_build_aggregate_node(GArrowExecutePlan *plan, /** * garrow_execute_plan_build_sink_node: * @plan: A #GArrowExecutePlan. - * @input: A #GarrowExecuteNode. + * @input: A #GArrowExecuteNode. * @options: A #GArrowSinkNodeOptions. * @error: (nullable): Return location for a #GError or %NULL. * @@ -2417,6 +2580,312 @@ garrow_sort_options_set_sort_keys(GArrowSortOptions *options, } + +typedef struct GArrowSetLookupOptionsPrivate_ { + GArrowDatum *value_set; +} GArrowSetLookupOptionsPrivate; + +enum { + PROP_SET_LOOKUP_OPTIONS_VALUE_SET = 1, + PROP_SET_LOOKUP_OPTIONS_SKIP_NULLS, +}; + +G_DEFINE_TYPE_WITH_PRIVATE(GArrowSetLookupOptions, + garrow_set_lookup_options, + GARROW_TYPE_FUNCTION_OPTIONS) + +#define GARROW_SET_LOOKUP_OPTIONS_GET_PRIVATE(object) \ + static_cast<GArrowSetLookupOptionsPrivate *>( \ + garrow_set_lookup_options_get_instance_private( \ + GARROW_SET_LOOKUP_OPTIONS(object))) + +static void +garrow_set_lookup_options_dispose(GObject *object) +{ + auto priv = GARROW_SET_LOOKUP_OPTIONS_GET_PRIVATE(object); + + if (priv->value_set) { + g_object_unref(priv->value_set); + priv->value_set = NULL; + } + + G_OBJECT_CLASS(garrow_set_lookup_options_parent_class)->dispose(object); +} + +static void +garrow_set_lookup_options_set_property(GObject *object, + guint prop_id, + const GValue *value, + GParamSpec *pspec) +{ + auto priv = GARROW_SET_LOOKUP_OPTIONS_GET_PRIVATE(object); + auto options = + garrow_set_lookup_options_get_raw(GARROW_SET_LOOKUP_OPTIONS(object)); + + switch (prop_id) { + case PROP_SET_LOOKUP_OPTIONS_VALUE_SET: + priv->value_set = GARROW_DATUM(g_value_dup_object(value)); + options->value_set = garrow_datum_get_raw(priv->value_set); + break; + case PROP_SET_LOOKUP_OPTIONS_SKIP_NULLS: + options->skip_nulls = g_value_get_boolean(value); + break; + default: + G_OBJECT_WARN_INVALID_PROPERTY_ID(object, prop_id, pspec); + break; + } +} + +static void +garrow_set_lookup_options_get_property(GObject *object, + guint prop_id, + GValue *value, + GParamSpec *pspec) +{ + auto priv = GARROW_SET_LOOKUP_OPTIONS_GET_PRIVATE(object); + auto options = + garrow_set_lookup_options_get_raw(GARROW_SET_LOOKUP_OPTIONS(object)); + + switch (prop_id) { + case PROP_SET_LOOKUP_OPTIONS_VALUE_SET: + g_value_set_object(value, priv->value_set); + break; + case
PROP_SET_LOOKUP_OPTIONS_SKIP_NULLS: + g_value_set_boolean(value, options->skip_nulls); + break; + default: + G_OBJECT_WARN_INVALID_PROPERTY_ID(object, prop_id, pspec); + break; + } +} + +static void +garrow_set_lookup_options_init(GArrowSetLookupOptions *object) +{ + auto priv = GARROW_FUNCTION_OPTIONS_GET_PRIVATE(object); + priv->options = static_cast<arrow::compute::FunctionOptions *>( + new arrow::compute::SetLookupOptions()); +} + +static void +garrow_set_lookup_options_class_init(GArrowSetLookupOptionsClass *klass) +{ + auto gobject_class = G_OBJECT_CLASS(klass); + + gobject_class->dispose = garrow_set_lookup_options_dispose; + gobject_class->set_property = garrow_set_lookup_options_set_property; + gobject_class->get_property = garrow_set_lookup_options_get_property; + + + arrow::compute::SetLookupOptions options; + + GParamSpec *spec; + /** + * GArrowSetLookupOptions:value-set: + * + * The set of values to look up input values into. + * + * Since: 6.0.0 + */ + spec = g_param_spec_object("value-set", + "Value set", + "The set of values to look up input values into", + GARROW_TYPE_DATUM, + static_cast<GParamFlags>(G_PARAM_READWRITE | + G_PARAM_CONSTRUCT_ONLY)); + g_object_class_install_property(gobject_class, + PROP_SET_LOOKUP_OPTIONS_VALUE_SET, + spec); + + /** + * GArrowSetLookupOptions:skip-nulls: + * + * Whether NULLs are skipped or not. + * + * Since: 6.0.0 + */ + spec = g_param_spec_boolean("skip-nulls", + "Skip NULLs", + "Whether NULLs are skipped or not", + options.skip_nulls, + static_cast<GParamFlags>(G_PARAM_READWRITE)); + g_object_class_install_property(gobject_class, + PROP_SET_LOOKUP_OPTIONS_SKIP_NULLS, + spec); +} + +/** + * garrow_set_lookup_options_new: + * @value_set: A #GArrowArrayDatum or #GArrowChunkedArrayDatum to be looked up. + * + * Returns: A newly created #GArrowSetLookupOptions.
+ * + * Since: 6.0.0 + */ +GArrowSetLookupOptions * +garrow_set_lookup_options_new(GArrowDatum *value_set) +{ + return GARROW_SET_LOOKUP_OPTIONS( + g_object_new(GARROW_TYPE_SET_LOOKUP_OPTIONS, + "value-set", value_set, + NULL)); +} + + +enum { + PROP_VARIANCE_OPTIONS_DDOF = 1, + PROP_VARIANCE_OPTIONS_SKIP_NULLS, + PROP_VARIANCE_OPTIONS_MIN_COUNT, +}; + +G_DEFINE_TYPE(GArrowVarianceOptions, + garrow_variance_options, + GARROW_TYPE_FUNCTION_OPTIONS) + +#define GARROW_VARIANCE_OPTIONS_GET_PRIVATE(object) \ + static_cast<GArrowVarianceOptionsPrivate *>( \ + garrow_variance_options_get_instance_private( \ + GARROW_VARIANCE_OPTIONS(object))) + +static void +garrow_variance_options_set_property(GObject *object, + guint prop_id, + const GValue *value, + GParamSpec *pspec) +{ + auto options = + garrow_variance_options_get_raw(GARROW_VARIANCE_OPTIONS(object)); + + switch (prop_id) { + case PROP_VARIANCE_OPTIONS_DDOF: + options->ddof = g_value_get_int(value); + break; + case PROP_VARIANCE_OPTIONS_SKIP_NULLS: + options->skip_nulls = g_value_get_boolean(value); + break; + case PROP_VARIANCE_OPTIONS_MIN_COUNT: + options->min_count = g_value_get_uint(value); + break; + default: + G_OBJECT_WARN_INVALID_PROPERTY_ID(object, prop_id, pspec); + break; + } +} + +static void +garrow_variance_options_get_property(GObject *object, + guint prop_id, + GValue *value, + GParamSpec *pspec) +{ + auto options = + garrow_variance_options_get_raw(GARROW_VARIANCE_OPTIONS(object)); + + switch (prop_id) { + case PROP_VARIANCE_OPTIONS_DDOF: + g_value_set_int(value, options->ddof); + break; + case PROP_VARIANCE_OPTIONS_SKIP_NULLS: + g_value_set_boolean(value, options->skip_nulls); + break; + case PROP_VARIANCE_OPTIONS_MIN_COUNT: + g_value_set_uint(value, options->min_count); + break; + default: + G_OBJECT_WARN_INVALID_PROPERTY_ID(object, prop_id, pspec); + break; + } +} + +static void +garrow_variance_options_init(GArrowVarianceOptions *object) +{ + auto priv = GARROW_FUNCTION_OPTIONS_GET_PRIVATE(object); + priv->options = static_cast<arrow::compute::FunctionOptions *>( + new arrow::compute::VarianceOptions()); +} + +static void +garrow_variance_options_class_init(GArrowVarianceOptionsClass *klass) +{ + auto gobject_class = G_OBJECT_CLASS(klass); + + gobject_class->set_property = garrow_variance_options_set_property; + gobject_class->get_property = garrow_variance_options_get_property; + + + arrow::compute::VarianceOptions options; + + GParamSpec *spec; + /** + * GArrowVarianceOptions:ddof: + * + * The Delta Degrees of Freedom (ddof) to be used. + * + * Since: 6.0.0 + */ + spec = g_param_spec_int("ddof", + "Delta Degrees of Freedom", + "The Delta Degrees of Freedom (ddof) to be used", + G_MININT, + G_MAXINT, + options.ddof, + static_cast<GParamFlags>(G_PARAM_READWRITE)); + g_object_class_install_property(gobject_class, + PROP_VARIANCE_OPTIONS_DDOF, + spec); + + /** + * GArrowVarianceOptions:skip-nulls: + * + * Whether NULLs are skipped or not. + * + * Since: 6.0.0 + */ + spec = g_param_spec_boolean("skip-nulls", + "Skip NULLs", + "Whether NULLs are skipped or not", + options.skip_nulls, + static_cast<GParamFlags>(G_PARAM_READWRITE)); + g_object_class_install_property(gobject_class, + PROP_VARIANCE_OPTIONS_SKIP_NULLS, + spec); + + /** + * GArrowVarianceOptions:min-count: + * + * If less than this many non-null values are observed, emit null.
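A usage sketch for the variance options implemented above; it assumes `array` is a numeric #GArrowArray built elsewhere, and it spells out the full garrow_function_execute() argument list, which the surrounding diff context abbreviates:

    /* Sketch: sample variance (ddof = 1) through the generic function API. */
    GArrowVarianceOptions *options = garrow_variance_options_new();
    g_object_set(options, "ddof", 1, NULL);
    GArrowFunction *function = garrow_function_find("variance");
    GArrowDatum *arg = GARROW_DATUM(garrow_array_datum_new(array));
    GList *args = g_list_append(NULL, arg);
    GError *error = NULL;
    GArrowDatum *result =
      garrow_function_execute(function, args,
                              GARROW_FUNCTION_OPTIONS(options), NULL, &error);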
+ * + * Since: 6.0.0 + */ + spec = g_param_spec_uint("min-count", + "Min count", + "If less than this many non-null values " + "are observed, emit null", + 0, + G_MAXUINT, + options.min_count, + static_cast<GParamFlags>(G_PARAM_READWRITE)); + g_object_class_install_property(gobject_class, + PROP_VARIANCE_OPTIONS_MIN_COUNT, + spec); + +} + +/** + * garrow_variance_options_new: + * + * Returns: A newly created #GArrowVarianceOptions. + * + * Since: 6.0.0 + */ +GArrowVarianceOptions * +garrow_variance_options_new(void) +{ + return GARROW_VARIANCE_OPTIONS( + g_object_new(GARROW_TYPE_VARIANCE_OPTIONS, NULL)); +} + + /** * garrow_array_cast: * @array: A #GArrowArray. @@ -3610,6 +4079,23 @@ garrow_function_options_get_raw(GArrowFunctionOptions *options) return priv->options; } + +GArrowFunctionDoc * +garrow_function_doc_new_raw(const arrow::compute::FunctionDoc *arrow_doc) +{ + return GARROW_FUNCTION_DOC(g_object_new(GARROW_TYPE_FUNCTION_DOC, + "doc", arrow_doc, + NULL)); +} + +arrow::compute::FunctionDoc * +garrow_function_doc_get_raw(GArrowFunctionDoc *doc) +{ + auto priv = GARROW_FUNCTION_DOC_GET_PRIVATE(doc); + return priv->doc; +} + + GArrowFunction * garrow_function_new_raw(std::shared_ptr<arrow::compute::Function> *arrow_function) { @@ -3755,3 +4241,18 @@ garrow_sort_options_get_raw(GArrowSortOptions *options) return static_cast<arrow::compute::SortOptions *>( garrow_function_options_get_raw(GARROW_FUNCTION_OPTIONS(options))); } + +arrow::compute::SetLookupOptions * +garrow_set_lookup_options_get_raw(GArrowSetLookupOptions *options) +{ + return static_cast<arrow::compute::SetLookupOptions *>( + garrow_function_options_get_raw(GARROW_FUNCTION_OPTIONS(options))); +} + + +arrow::compute::VarianceOptions * +garrow_variance_options_get_raw(GArrowVarianceOptions *options) +{ + return static_cast<arrow::compute::VarianceOptions *>( + garrow_function_options_get_raw(GARROW_FUNCTION_OPTIONS(options))); +} diff --git a/c_glib/arrow-glib/compute.h b/c_glib/arrow-glib/compute.h index 108b27ff7ba..2171d6abd9a 100644 --- a/c_glib/arrow-glib/compute.h +++ b/c_glib/arrow-glib/compute.h @@ -51,6 +51,31 @@ struct _GArrowFunctionOptionsClass }; + +#define GARROW_TYPE_FUNCTION_DOC (garrow_function_doc_get_type()) +G_DECLARE_DERIVABLE_TYPE(GArrowFunctionDoc, + garrow_function_doc, + GARROW, + FUNCTION_DOC, + GObject) +struct _GArrowFunctionDocClass +{ + GObjectClass parent_class; +}; + +GARROW_AVAILABLE_IN_6_0 +gchar * +garrow_function_doc_get_summary(GArrowFunctionDoc *doc); +GARROW_AVAILABLE_IN_6_0 +gchar * +garrow_function_doc_get_description(GArrowFunctionDoc *doc); +GARROW_AVAILABLE_IN_6_0 +gchar ** +garrow_function_doc_get_arg_names(GArrowFunctionDoc *doc); +GARROW_AVAILABLE_IN_6_0 +gchar * +garrow_function_doc_get_options_class_name(GArrowFunctionDoc *doc); + + #define GARROW_TYPE_FUNCTION (garrow_function_get_type()) G_DECLARE_DERIVABLE_TYPE(GArrowFunction, garrow_function, @@ -73,6 +98,10 @@ GArrowDatum *garrow_function_execute(GArrowFunction *function, GArrowExecuteContext *context, GError **error); +GARROW_AVAILABLE_IN_6_0 +GArrowFunctionDoc * +garrow_function_get_doc(GArrowFunction *function); + #define GARROW_TYPE_EXECUTE_NODE_OPTIONS (garrow_execute_node_options_get_type()) G_DECLARE_DERIVABLE_TYPE(GArrowExecuteNodeOptions, @@ -436,6 +465,38 @@ garrow_sort_options_add_sort_key(GArrowSortOptions *options, GArrowSortKey *sort_key); + +#define GARROW_TYPE_SET_LOOKUP_OPTIONS (garrow_set_lookup_options_get_type()) +G_DECLARE_DERIVABLE_TYPE(GArrowSetLookupOptions, + garrow_set_lookup_options, + GARROW, + SET_LOOKUP_OPTIONS, + GArrowFunctionOptions) +struct _GArrowSetLookupOptionsClass +{ + GArrowFunctionOptionsClass parent_class; +}; + 
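The corresponding C-level usage of the set-lookup options declared above — a sketch assuming `values` and `value_set` are #GArrowArray inputs owned by the caller:

    /* Sketch: evaluate "is_in" — which elements of values appear in
     * value_set? Both arrays are assumed to exist already. */
    GArrowArrayDatum *value_set_datum = garrow_array_datum_new(value_set);
    GArrowSetLookupOptions *options =
      garrow_set_lookup_options_new(GARROW_DATUM(value_set_datum));
    GArrowFunction *is_in = garrow_function_find("is_in");
    GArrowDatum *arg = GARROW_DATUM(garrow_array_datum_new(values));
    GList *args = g_list_append(NULL, arg);
    GError *error = NULL;
    GArrowDatum *result =
      garrow_function_execute(is_in, args,
                              GARROW_FUNCTION_OPTIONS(options), NULL, &error);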
+GARROW_AVAILABLE_IN_6_0 +GArrowSetLookupOptions * +garrow_set_lookup_options_new(GArrowDatum *value_set); + + +#define GARROW_TYPE_VARIANCE_OPTIONS (garrow_variance_options_get_type()) +G_DECLARE_DERIVABLE_TYPE(GArrowVarianceOptions, + garrow_variance_options, + GARROW, + VARIANCE_OPTIONS, + GArrowFunctionOptions) +struct _GArrowVarianceOptionsClass +{ + GArrowFunctionOptionsClass parent_class; +}; + +GARROW_AVAILABLE_IN_6_0 +GArrowVarianceOptions * +garrow_variance_options_new(void); + + GArrowArray *garrow_array_cast(GArrowArray *array, GArrowDataType *target_data_type, GArrowCastOptions *options, diff --git a/c_glib/arrow-glib/compute.hpp b/c_glib/arrow-glib/compute.hpp index 01265eee2a8..88f55d5329c 100644 --- a/c_glib/arrow-glib/compute.hpp +++ b/c_glib/arrow-glib/compute.hpp @@ -30,6 +30,11 @@ garrow_execute_context_get_raw(GArrowExecuteContext *context); arrow::compute::FunctionOptions * garrow_function_options_get_raw(GArrowFunctionOptions *options); +GArrowFunctionDoc * +garrow_function_doc_new_raw(const arrow::compute::FunctionDoc *arrow_doc); +arrow::compute::FunctionDoc * +garrow_function_doc_get_raw(GArrowFunctionDoc *doc); + GArrowFunction * garrow_function_new_raw(std::shared_ptr<arrow::compute::Function> *arrow_function); std::shared_ptr<arrow::compute::Function> @@ -89,3 +94,11 @@ garrow_sort_key_get_raw(GArrowSortKey *sort_key); arrow::compute::SortOptions * garrow_sort_options_get_raw(GArrowSortOptions *options); + + +arrow::compute::SetLookupOptions * +garrow_set_lookup_options_get_raw(GArrowSetLookupOptions *options); + + +arrow::compute::VarianceOptions * +garrow_variance_options_get_raw(GArrowVarianceOptions *options); diff --git a/c_glib/arrow-glib/input-stream.cpp b/c_glib/arrow-glib/input-stream.cpp index 64f366a6282..37e4702ff16 100644 --- a/c_glib/arrow-glib/input-stream.cpp +++ b/c_glib/arrow-glib/input-stream.cpp @@ -50,6 +50,8 @@ G_BEGIN_DECLS * * #GArrowBufferInputStream is a class to read data on buffer. * + * #GArrowFileInputStream is a class to read data in file. + * * #GArrowMemoryMappedInputStream is a class to read data in file by * mapping the file on memory. It supports zero copy. * @@ -631,6 +633,86 @@ garrow_buffer_input_stream_get_buffer(GArrowBufferInputStream *input_stream) } + +G_DEFINE_TYPE(GArrowFileInputStream, + garrow_file_input_stream, + GARROW_TYPE_SEEKABLE_INPUT_STREAM); + +static void +garrow_file_input_stream_init(GArrowFileInputStream *object) +{ +} + +static void +garrow_file_input_stream_class_init(GArrowFileInputStreamClass *klass) +{ +} + +/** + * garrow_file_input_stream_new: + * @path: The path of the file to be opened. + * @error: (nullable): Return location for a #GError or %NULL. + * + * Returns: (nullable): A newly created #GArrowFileInputStream + * or %NULL on error. + * + * Since: 6.0.0 + */ +GArrowFileInputStream * +garrow_file_input_stream_new(const gchar *path, + GError **error) +{ + auto arrow_stream_result = arrow::io::ReadableFile::Open(path); + if (garrow::check(error, arrow_stream_result, "[file-input-stream][new]")) { + auto arrow_stream = *arrow_stream_result; + return garrow_file_input_stream_new_raw(&arrow_stream); + } else { + return NULL; + } +} + +/** + * garrow_file_input_stream_new_file_descriptor: + * @file_descriptor: The file descriptor of this input stream. + * @error: (nullable): Return location for a #GError or %NULL. + * + * Returns: (nullable): A newly created #GArrowFileInputStream + * or %NULL on error.
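A minimal C sketch of opening a file with the new stream class above; the path is an illustrative assumption:

    /* Sketch: open a local file and read five bytes from the start. */
    GError *error = NULL;
    GArrowFileInputStream *input =
      garrow_file_input_stream_new("/tmp/data.arrow", &error);
    if (input) {
      GArrowBuffer *buffer =
        garrow_seekable_input_stream_read_at(
          GARROW_SEEKABLE_INPUT_STREAM(input), 0, 5, &error);
      /* ... use buffer ... */
      g_object_unref(input);
    }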
+ * + * Since: 6.0.0 + */ +GArrowFileInputStream * +garrow_file_input_stream_new_file_descriptor(gint file_descriptor, + GError **error) +{ + auto arrow_stream_result = arrow::io::ReadableFile::Open(file_descriptor); + if (garrow::check(error, + arrow_stream_result, + "[file-input-stream][new-file-descriptor]")) { + auto arrow_stream = *arrow_stream_result; + return garrow_file_input_stream_new_raw(&arrow_stream); + } else { + return NULL; + } +} + +/** + * garrow_file_input_stream_get_file_descriptor: + * @stream: A #GArrowFileInputStream. + * + * Returns: The file descriptor of @stream. + * + * Since: 6.0.0 + */ +gint +garrow_file_input_stream_get_file_descriptor(GArrowFileInputStream *stream) +{ + auto arrow_stream = + std::static_pointer_cast<arrow::io::ReadableFile>( + garrow_input_stream_get_raw(GARROW_INPUT_STREAM(stream))); + return arrow_stream->file_descriptor(); +} + + G_DEFINE_TYPE(GArrowMemoryMappedInputStream, garrow_memory_mapped_input_stream, GARROW_TYPE_SEEKABLE_INPUT_STREAM); @@ -657,18 +739,14 @@ GArrowMemoryMappedInputStream * garrow_memory_mapped_input_stream_new(const gchar *path, GError **error) { - auto arrow_memory_mapped_file_result = - arrow::io::MemoryMappedFile::Open(std::string(path), - arrow::io::FileMode::READ); - if (arrow_memory_mapped_file_result.ok()) { - auto arrow_memory_mapped_file = - arrow_memory_mapped_file_result.ValueOrDie(); - return garrow_memory_mapped_input_stream_new_raw(&(arrow_memory_mapped_file)); + auto arrow_stream_result = + arrow::io::MemoryMappedFile::Open(path, arrow::io::FileMode::READ); + if (garrow::check(error, + arrow_stream_result, + "[memory-mapped-input-stream][new]")) { + auto arrow_stream = *arrow_stream_result; + return garrow_memory_mapped_input_stream_new_raw(&arrow_stream); } else { - std::string context("[memory-mapped-input-stream][open]: <"); - context += path; - context += ">"; - garrow::check(error, arrow_memory_mapped_file_result, context.c_str()); return NULL; } } @@ -1203,16 +1281,28 @@ garrow_buffer_input_stream_get_raw(GArrowBufferInputStream *buffer_input_stream) return arrow_buffer_reader; } + +GArrowFileInputStream * +garrow_file_input_stream_new_raw( + std::shared_ptr<arrow::io::ReadableFile> *arrow_stream) +{ + return GARROW_FILE_INPUT_STREAM(g_object_new(GARROW_TYPE_FILE_INPUT_STREAM, + "input-stream", arrow_stream, + NULL)); +} + + GArrowMemoryMappedInputStream * -garrow_memory_mapped_input_stream_new_raw(std::shared_ptr<arrow::io::MemoryMappedFile> *arrow_memory_mapped_file) +garrow_memory_mapped_input_stream_new_raw( + std::shared_ptr<arrow::io::MemoryMappedFile> *arrow_stream) { - auto object = g_object_new(GARROW_TYPE_MEMORY_MAPPED_INPUT_STREAM, - "input-stream", arrow_memory_mapped_file, - NULL); - auto memory_mapped_input_stream = GARROW_MEMORY_MAPPED_INPUT_STREAM(object); - return memory_mapped_input_stream; + return GARROW_MEMORY_MAPPED_INPUT_STREAM( + g_object_new(GARROW_TYPE_MEMORY_MAPPED_INPUT_STREAM, + "input-stream", arrow_stream, + NULL)); } + GArrowCompressedInputStream * garrow_compressed_input_stream_new_raw(std::shared_ptr<arrow::io::CompressedInputStream> *arrow_raw, GArrowCodec *codec, diff --git a/c_glib/arrow-glib/input-stream.h b/c_glib/arrow-glib/input-stream.h index 4b4c51eb3e7..5f583c80486 100644 --- a/c_glib/arrow-glib/input-stream.h +++ b/c_glib/arrow-glib/input-stream.h @@ -104,54 +104,42 @@ GArrowBufferInputStream *garrow_buffer_input_stream_new(GArrowBuffer *buffer); GArrowBuffer *garrow_buffer_input_stream_get_buffer(GArrowBufferInputStream *input_stream); -#define GARROW_TYPE_MEMORY_MAPPED_INPUT_STREAM \ - (garrow_memory_mapped_input_stream_get_type()) -#define GARROW_MEMORY_MAPPED_INPUT_STREAM(obj) \ -
(G_TYPE_CHECK_INSTANCE_CAST((obj), \ - GARROW_TYPE_MEMORY_MAPPED_INPUT_STREAM, \ - GArrowMemoryMappedInputStream)) -#define GARROW_MEMORY_MAPPED_INPUT_STREAM_CLASS(klass) \ - (G_TYPE_CHECK_CLASS_CAST((klass), \ - GARROW_TYPE_MEMORY_MAPPED_INPUT_STREAM, \ - GArrowMemoryMappedInputStreamClass)) -#define GARROW_IS_MEMORY_MAPPED_INPUT_STREAM(obj) \ - (G_TYPE_CHECK_INSTANCE_TYPE((obj), \ - GARROW_TYPE_MEMORY_MAPPED_INPUT_STREAM)) -#define GARROW_IS_MEMORY_MAPPED_INPUT_STREAM_CLASS(klass) \ - (G_TYPE_CHECK_CLASS_TYPE((klass), \ - GARROW_TYPE_MEMORY_MAPPED_INPUT_STREAM)) -#define GARROW_MEMORY_MAPPED_INPUT_STREAM_GET_CLASS(obj) \ - (G_TYPE_INSTANCE_GET_CLASS((obj), \ - GARROW_TYPE_MEMORY_MAPPED_INPUT_STREAM, \ - GArrowMemoryMappedInputStreamClass)) - -typedef struct _GArrowMemoryMappedInputStream GArrowMemoryMappedInputStream; -#ifndef __GTK_DOC_IGNORE__ -typedef struct _GArrowMemoryMappedInputStreamClass GArrowMemoryMappedInputStreamClass; -#endif - -/** - * GArrowMemoryMappedInputStream: - * - * It wraps `arrow::io::MemoryMappedFile`. - */ -struct _GArrowMemoryMappedInputStream +#define GARROW_TYPE_FILE_INPUT_STREAM (garrow_file_input_stream_get_type()) +G_DECLARE_DERIVABLE_TYPE(GArrowFileInputStream, + garrow_file_input_stream, + GARROW, + FILE_INPUT_STREAM, + GArrowSeekableInputStream) +struct _GArrowFileInputStreamClass { - /*< private >*/ - GArrowSeekableInputStream parent_instance; + GArrowSeekableInputStreamClass parent_class; }; -#ifndef __GTK_DOC_IGNORE__ +GArrowFileInputStream * +garrow_file_input_stream_new(const gchar *path, + GError **error); +GArrowFileInputStream * +garrow_file_input_stream_new_file_descriptor(gint file_descriptor, + GError **error); +gint +garrow_file_input_stream_get_file_descriptor(GArrowFileInputStream *stream); + + +#define GARROW_TYPE_MEMORY_MAPPED_INPUT_STREAM \ + (garrow_memory_mapped_input_stream_get_type()) +G_DECLARE_DERIVABLE_TYPE(GArrowMemoryMappedInputStream, + garrow_memory_mapped_input_stream, + GARROW, + MEMORY_MAPPED_INPUT_STREAM, + GArrowSeekableInputStream) struct _GArrowMemoryMappedInputStreamClass { GArrowSeekableInputStreamClass parent_class; }; -#endif -GType garrow_memory_mapped_input_stream_get_type(void) G_GNUC_CONST; - -GArrowMemoryMappedInputStream *garrow_memory_mapped_input_stream_new(const gchar *path, - GError **error); +GArrowMemoryMappedInputStream * +garrow_memory_mapped_input_stream_new(const gchar *path, + GError **error); #define GARROW_TYPE_GIO_INPUT_STREAM \ diff --git a/c_glib/arrow-glib/input-stream.hpp b/c_glib/arrow-glib/input-stream.hpp index 88fbb8f64c1..2a0a3d3ddcc 100644 --- a/c_glib/arrow-glib/input-stream.hpp +++ b/c_glib/arrow-glib/input-stream.hpp @@ -40,7 +40,16 @@ garrow_buffer_input_stream_new_raw(std::shared_ptr<arrow::io::BufferReader> *arr GArrowBuffer *buffer); std::shared_ptr<arrow::io::BufferReader> garrow_buffer_input_stream_get_raw(GArrowBufferInputStream *input_stream); -GArrowMemoryMappedInputStream *garrow_memory_mapped_input_stream_new_raw(std::shared_ptr<arrow::io::MemoryMappedFile> *arrow_memory_mapped_file); + +GArrowFileInputStream * +garrow_file_input_stream_new_raw( + std::shared_ptr<arrow::io::ReadableFile> *arrow_stream); + + +GArrowMemoryMappedInputStream * +garrow_memory_mapped_input_stream_new_raw( + std::shared_ptr<arrow::io::MemoryMappedFile> *arrow_stream); + GArrowCompressedInputStream * garrow_compressed_input_stream_new_raw(std::shared_ptr<arrow::io::CompressedInputStream> *arrow_raw, diff --git a/c_glib/arrow-glib/reader.cpp b/c_glib/arrow-glib/reader.cpp index 3e6539feb5a..98038248050 100644 --- a/c_glib/arrow-glib/reader.cpp +++ b/c_glib/arrow-glib/reader.cpp @@ -1360,10 +1360,13 @@
garrow_csv_read_options_set_null_values(GArrowCSVReadOptions *options, * garrow_csv_read_options_get_null_values: * @options: A #GArrowCSVReadOptions. * - * Return: (nullable) (array zero-terminated=1) (element-type utf8) (transfer full): - * The values to be processed as null. It's a %NULL-terminated string array. + * Returns: (nullable) (array zero-terminated=1) (element-type utf8) (transfer full): + * The values to be processed as null. + * * If the number of values is zero, this returns %NULL. - * It must be freed with g_strfreev() when no longer needed. + * + * It's a %NULL-terminated string array. It must be freed with + * g_strfreev() when no longer needed. * * Since: 0.14.0 */ @@ -1425,10 +1428,13 @@ garrow_csv_read_options_set_true_values(GArrowCSVReadOptions *options, * garrow_csv_read_options_get_true_values: * @options: A #GArrowCSVReadOptions. * - * Return: (nullable) (array zero-terminated=1) (element-type utf8) (transfer full): - * The values to be processed as true. It's a %NULL-terminated string array. + * Returns: (nullable) (array zero-terminated=1) (element-type utf8) (transfer full): + * The values to be processed as true. + * * If the number of values is zero, this returns %NULL. - * It must be freed with g_strfreev() when no longer needed. + * + * It's a %NULL-terminated string array. It must be freed with + * g_strfreev() when no longer needed. * * Since: 0.14.0 */ @@ -1490,10 +1496,13 @@ garrow_csv_read_options_set_false_values(GArrowCSVReadOptions *options, * garrow_csv_read_options_get_false_values: * @options: A #GArrowCSVReadOptions. * - * Return: (nullable) (array zero-terminated=1) (element-type utf8) (transfer full): - * The values to be processed as false. It's a %NULL-terminated string array. + * Returns: (nullable) (array zero-terminated=1) (element-type utf8) (transfer full): + * The values to be processed as false. + * * If the number of values is zero, this returns %NULL. - * It must be freed with g_strfreev() when no longer needed. + * + * It's a %NULL-terminated string array. It must be freed with + * g_strfreev() when no longer needed. * * Since: 0.14.0 */ @@ -1556,10 +1565,13 @@ garrow_csv_read_options_set_column_names(GArrowCSVReadOptions *options, * garrow_csv_read_options_get_column_names: * @options: A #GArrowCSVReadOptions. * - * Return: (nullable) (array zero-terminated=1) (element-type utf8) (transfer full): - * The column names. It's a %NULL-terminated string array. + * Returns: (nullable) (array zero-terminated=1) (element-type utf8) (transfer full): + * The column names. + * * If the number of values is zero, this returns %NULL. - * It must be freed with g_strfreev() when no longer needed. + * + * It's a %NULL-terminated string array. It must be freed with + * g_strfreev() when no longer needed. 
* * Since: 0.15.0 */ diff --git a/c_glib/doc/arrow-dataset-glib/arrow-dataset-glib-docs.xml b/c_glib/doc/arrow-dataset-glib/arrow-dataset-glib-docs.xml index 3e8da5bd9d1..b13195b0703 100644 --- a/c_glib/doc/arrow-dataset-glib/arrow-dataset-glib-docs.xml +++ b/c_glib/doc/arrow-dataset-glib/arrow-dataset-glib-docs.xml @@ -39,6 +39,8 @@ Data + Partitioning + Dataset Dataset factory @@ -66,8 +68,12 @@ Index of deprecated API + + Index of new symbols in 6.0.0 + + - Index of new symbols in 4.0.0 + Index of new symbols in 5.0.0 diff --git a/c_glib/test/dataset/test-file-system-dataset.rb b/c_glib/test/dataset/test-file-system-dataset.rb index 6d6ec3b18c6..0e856b678f8 100644 --- a/c_glib/test/dataset/test-file-system-dataset.rb +++ b/c_glib/test/dataset/test-file-system-dataset.rb @@ -16,19 +16,73 @@ # under the License. class TestDatasetFileSystemDataset < Test::Unit::TestCase + include Helper::Buildable + include Helper::Readable + def setup omit("Arrow Dataset is required") unless defined?(ArrowDataset) Dir.mktmpdir do |tmpdir| @dir = tmpdir - format = ArrowDataset::IPCFileFormat.new - factory = ArrowDataset::FileSystemDatasetFactory.new(format) - factory.file_system = Arrow::LocalFileSystem.new - @dataset = factory.finish + @format = ArrowDataset::IPCFileFormat.new + @factory = ArrowDataset::FileSystemDatasetFactory.new(@format) + @file_system = Arrow::LocalFileSystem.new + @factory.file_system = @file_system + partitioning_schema = build_schema(label: Arrow::StringDataType.new) + @partitioning = + ArrowDataset::DirectoryPartitioning.new(partitioning_schema) + @factory.partitioning = @partitioning yield end end def test_type_name - assert_equal("filesystem", @dataset.type_name) + dataset = @factory.finish + assert_equal("filesystem", dataset.type_name) + end + + def test_format + dataset = @factory.finish + assert_equal(@format, dataset.format) + end + + def test_file_system + dataset = @factory.finish + assert_equal(@file_system, dataset.file_system) + end + + def test_partitioning + dataset = @factory.finish + assert_equal(@partitioning, dataset.partitioning) + end + + def test_read_write + table = build_table(label: build_string_array(["a", "a", "b", "c"]), + count: build_int32_array([1, 10, 2, 3])) + table_reader = Arrow::TableBatchReader.new(table) + scanner_builder = ArrowDataset::ScannerBuilder.new(table_reader) + scanner = scanner_builder.finish + options = ArrowDataset::FileSystemDatasetWriteOptions.new + options.file_write_options = @format.default_write_options + options.file_system = Arrow::LocalFileSystem.new + options.base_dir = @dir + options.base_name_template = "{i}.arrow" + options.partitioning = @partitioning + ArrowDataset::FileSystemDataset.write_scanner(scanner, options) + Find.find(@dir) do |path| + @factory.add_path(path) if File.file?(path) + end + @factory.partition_base_dir = @dir + dataset = @factory.finish + assert_equal(build_table(count: [ + build_int32_array([1, 10]), + build_int32_array([2]), + build_int32_array([3]), + ], + label: [ + build_string_array(["a", "a"]), + build_string_array(["b"]), + build_string_array(["c"]), + ]), + dataset.to_table) end end diff --git a/c_glib/test/dataset/test-file-writer.rb b/c_glib/test/dataset/test-file-writer.rb new file mode 100644 index 00000000000..5b25d6044d6 --- /dev/null +++ b/c_glib/test/dataset/test-file-writer.rb @@ -0,0 +1,65 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. 
See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + +class TestDatasetFileWriter < Test::Unit::TestCase + include Helper::Buildable + include Helper::Readable + + def setup + omit("Arrow Dataset is required") unless defined?(ArrowDataset) + Dir.mktmpdir do |tmpdir| + @dir = tmpdir + @format = ArrowDataset::IPCFileFormat.new + @file_system = Arrow::LocalFileSystem.new + @path = File.join(@dir, "data.arrow") + @output = @file_system.open_output_stream(@path) + @schema = build_schema(visible: Arrow::BooleanDataType.new, + point: Arrow::UInt8DataType.new) + @writer = @format.open_writer(@output, + @file_system, + @path, + @schema, + @format.default_write_options) + yield + end + end + + def test_write_record_batch + record_batch = build_record_batch( + visible: build_boolean_array([true, false, true]), + point: build_uint8_array([1, 2, 3])) + @writer.write_record_batch(record_batch) + @writer.finish + @output.close + read_table(@path) do |written_table| + assert_equal(Arrow::Table.new(record_batch.schema, + [record_batch]), + written_table) + end + end + + def test_write_record_batch_reader + table = build_table(visible: build_boolean_array([true, false, true]), + point: build_uint8_array([1, 2, 3])) + @writer.write_record_batch_reader(Arrow::TableBatchReader.new(table)) + @writer.finish + @output.close + read_table(@path) do |written_table| + assert_equal(table, written_table) + end + end +end diff --git a/c_glib/test/dataset/test-partitioning-options.rb b/c_glib/test/dataset/test-partitioning-options.rb new file mode 100644 index 00000000000..9ff585aa7cf --- /dev/null +++ b/c_glib/test/dataset/test-partitioning-options.rb @@ -0,0 +1,46 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + +class TestDatasetPartitioningOptions < Test::Unit::TestCase + include Helper::Buildable + + def setup + omit("Arrow Dataset is required") unless defined?(ArrowDataset) + @options = ArrowDataset::PartitioningOptions.new + end + + def test_infer_dictionary + assert_false(@options.infer_dictionary?) + @options.infer_dictionary = true + assert_true(@options.infer_dictionary?) 
+ end + + def test_schema + assert_nil(@options.schema) + schema = build_schema(year: Arrow::UInt16DataType.new) + @options.schema = schema + assert_equal(schema, @options.schema) + end + + def test_segment_encoding + assert_equal(ArrowDataset::SegmentEncoding::NONE, + @options.segment_encoding) + @options.segment_encoding = :uri + assert_equal(ArrowDataset::SegmentEncoding::URI, + @options.segment_encoding) + end +end diff --git a/c_glib/test/dataset/test-partitioning.rb b/c_glib/test/dataset/test-partitioning.rb new file mode 100644 index 00000000000..d98e51f3c59 --- /dev/null +++ b/c_glib/test/dataset/test-partitioning.rb @@ -0,0 +1,34 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + +class TestDatasetPartitioning < Test::Unit::TestCase + include Helper::Buildable + + def setup + omit("Arrow Dataset is required") unless defined?(ArrowDataset) + end + + def test_default + assert_equal("default", ArrowDataset::Partitioning.new.type_name) + end + + def test_directory + schema = build_schema(year: Arrow::UInt16DataType.new) + partitioning = ArrowDataset::DirectoryPartitioning.new(schema) + assert_equal("schema", partitioning.type_name) + end +end diff --git a/c_glib/test/dataset/test-scanner.rb b/c_glib/test/dataset/test-scanner.rb index f7702d4905f..ed6a706c6f2 100644 --- a/c_glib/test/dataset/test-scanner.rb +++ b/c_glib/test/dataset/test-scanner.rb @@ -45,4 +45,11 @@ def setup def test_to_table assert_equal(@table, @scanner.to_table) end + + def test_new_record_batch_reader + reader = Arrow::TableBatchReader.new(@table) + builder = ArrowDataset::ScannerBuilder.new(reader) + scanner = builder.finish + assert_equal(@table, scanner.to_table) + end end diff --git a/c_glib/test/helper/buildable.rb b/c_glib/test/helper/buildable.rb index 356fa651c6a..3a1240cfa1f 100644 --- a/c_glib/test/helper/buildable.rb +++ b/c_glib/test/helper/buildable.rb @@ -17,6 +17,13 @@ module Helper module Buildable + def build_schema(fields) + fields = fields.collect do |name, data_type| + Arrow::Field.new(name, data_type) + end + Arrow::Schema.new(fields) + end + def build_null_array(values) build_array(Arrow::NullArrayBuilder.new, values) end diff --git a/c_glib/test/helper/readable.rb b/c_glib/test/helper/readable.rb new file mode 100644 index 00000000000..81bf0795c6b --- /dev/null +++ b/c_glib/test/helper/readable.rb @@ -0,0 +1,47 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. 
You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + +module Helper + module Readable + def read_table(input, type: :file) + if input.is_a?(Arrow::Buffer) + input_stream = Arrow::BufferInputStream.new(input) + else + input_stream = Arrow::FileInputStream.new(input) + end + begin + if type == :file + reader = Arrow::RecordBatchFileReader.new(input_stream) + record_batches = [] + reader.n_record_batches.times do |i| + record_batches << reader.read_record_batch(i) + end + yield(Arrow::Table.new(record_batches[0].schema, record_batches)) + else + reader = Arrow::RecordBatchStreamReader.new(input_stream) + begin + yield(reader.read_all) + ensure + reader.close + end + end + ensure + input_stream.close + end + end + end +end diff --git a/c_glib/test/run-test.rb b/c_glib/test/run-test.rb index abae4e722c5..621c78c3986 100755 --- a/c_glib/test/run-test.rb +++ b/c_glib/test/run-test.rb @@ -84,6 +84,7 @@ def should_unlock_gvl?(info, klass) end require "fileutils" +require "find" require "rbconfig" require "stringio" require "tempfile" @@ -97,6 +98,7 @@ def should_unlock_gvl?(info, klass) end require_relative "helper/omittable" require_relative "helper/plasma-store" +require_relative "helper/readable" require_relative "helper/writable" exit(Test::Unit::AutoRunner.run(true, test_dir.to_s)) diff --git a/c_glib/test/test-file-input-stream.rb b/c_glib/test/test-file-input-stream.rb new file mode 100644 index 00000000000..2b43f97f5dd --- /dev/null +++ b/c_glib/test/test-file-input-stream.rb @@ -0,0 +1,102 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + +class TestFileInputStream < Test::Unit::TestCase + def setup + @data = "Hello World" + @tempfile = Tempfile.open("arrow-file-input-stream") + @tempfile.write(@data) + @tempfile.close + end + + def test_new + input = Arrow::FileInputStream.new(@tempfile.path) + begin + buffer = input.read(5) + assert_equal("Hello", buffer.data.to_s) + ensure + input.close + end + end + + def test_close + input = Arrow::FileInputStream.new(@tempfile.path) + assert do + not input.closed? + end + input.close + assert do + input.closed?
+ end + end + + def test_size + input = Arrow::FileInputStream.new(@tempfile.path) + begin + assert_equal(@data.bytesize, input.size) + ensure + input.close + end + end + + def test_read + input = Arrow::FileInputStream.new(@tempfile.path) + begin + buffer = input.read(5) + assert_equal("Hello", buffer.data.to_s) + ensure + input.close + end + end + + def test_read_at + input = Arrow::FileInputStream.new(@tempfile.path) + begin + buffer = input.read_at(6, 5) + assert_equal("World", buffer.data.to_s) + ensure + input.close + end + end + + def test_mode + input = Arrow::FileInputStream.new(@tempfile.path) + begin + assert_equal(Arrow::FileMode::READ, input.mode) + ensure + input.close + end + end + + def test_file_descriptor + @tempfile.open + begin + fd = @tempfile.fileno + input = Arrow::FileInputStream.new(fd) + begin + assert_equal(fd, input.file_descriptor) + ensure + input.close + end + ensure + begin + @tempfile.close + rescue + end + end + end +end diff --git a/c_glib/test/test-function-doc.rb b/c_glib/test/test-function-doc.rb new file mode 100644 index 00000000000..7e624a5ab7c --- /dev/null +++ b/c_glib/test/test-function-doc.rb @@ -0,0 +1,43 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + +class TestFunctionDoc < Test::Unit::TestCase + def setup + @doc = Arrow::Function.find("or").doc + end + + def test_summary + assert_equal("Logical 'or' boolean values", + @doc.summary) + end + + def test_description + assert_equal(<<-DESCRIPTION.chomp, @doc.description) +When a null is encountered in either input, a null is output. +For a different null behavior, see function "or_kleene". 
+ DESCRIPTION + end + + def test_arg_names + assert_equal(["x", "y"], @doc.arg_names) + end + + def test_options_class_name + doc = Arrow::Function.find("cast").doc + assert_equal("CastOptions", doc.options_class_name) + end +end diff --git a/c_glib/test/test-is-in.rb b/c_glib/test/test-is-in.rb index ba44075d6b3..590b5e3798a 100644 --- a/c_glib/test/test-is-in.rb +++ b/c_glib/test/test-is-in.rb @@ -46,6 +46,16 @@ def test_null_in_both assert_equal(build_boolean_array([false, true, true, true]), left.is_in(right)) end + + def test_options + left = build_int16_array([1, 0, nil, 2]) + right = build_int16_array([2, 0, nil]) + is_in = Arrow::Function.find("is_in") + options = Arrow::SetLookupOptions.new(Arrow::ArrayDatum.new(right)) + assert_equal(build_boolean_array([false, true, true, true]), + is_in.execute([Arrow::ArrayDatum.new(left)], + options).value) + end end sub_test_case("ChunkedArray") do @@ -92,5 +102,19 @@ def test_null_in_both assert_equal(build_boolean_array([false, true, true, true]), left.is_in_chunked_array(right)) end + + def test_options + left = build_int16_array([1, 0, nil, 2]) + chunks = [ + build_int16_array([2, 0]), + build_int16_array([3, nil]) + ] + right = Arrow::ChunkedArray.new(chunks) + is_in = Arrow::Function.find("is_in") + options = Arrow::SetLookupOptions.new(Arrow::ChunkedArrayDatum.new(right)) + assert_equal(build_boolean_array([false, true, true, true]), + is_in.execute([Arrow::ArrayDatum.new(left)], + options).value) + end end end diff --git a/c_glib/test/test-set-lookup-options.rb b/c_glib/test/test-set-lookup-options.rb new file mode 100644 index 00000000000..779bacef683 --- /dev/null +++ b/c_glib/test/test-set-lookup-options.rb @@ -0,0 +1,43 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + +class TestSetLookupOptions < Test::Unit::TestCase + include Helper::Buildable + + def test_new + value_set = Arrow::ArrayDatum.new(build_int8_array([1, 2, 3])) + options = Arrow::SetLookupOptions.new(value_set) + assert_equal(value_set, options.value_set) + end + + sub_test_case("instance methods") do + def setup + value_set = Arrow::ArrayDatum.new(build_int8_array([1, 2, 3])) + @options = Arrow::SetLookupOptions.new(value_set) + end + + def test_skip_nulls + assert do + not @options.skip_nulls? + end + @options.skip_nulls = true + assert do + @options.skip_nulls? + end + end + end +end diff --git a/c_glib/test/test-variance-options.rb b/c_glib/test/test-variance-options.rb new file mode 100644 index 00000000000..64bdf670bf0 --- /dev/null +++ b/c_glib/test/test-variance-options.rb @@ -0,0 +1,46 @@ +# Licensed to the Apache Software Foundation (ASF) under one +# or more contributor license agreements. See the NOTICE file +# distributed with this work for additional information +# regarding copyright ownership. 
The ASF licenses this file +# to you under the Apache License, Version 2.0 (the +# "License"); you may not use this file except in compliance +# with the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, +# software distributed under the License is distributed on an +# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +# KIND, either express or implied. See the License for the +# specific language governing permissions and limitations +# under the License. + +class TestVarianceOptions < Test::Unit::TestCase + include Helper::Buildable + + def setup + @options = Arrow::VarianceOptions.new + end + + def test_ddof + assert_equal(0, @options.ddof) + @options.ddof = 1 + assert_equal(1, @options.ddof) + end + + def test_skip_nulls + assert do + @options.skip_nulls? + end + @options.skip_nulls = false + assert do + not @options.skip_nulls? + end + end + + def test_min_count + assert_equal(0, @options.min_count) + @options.min_count = 1 + assert_equal(1, @options.min_count) + end +end diff --git a/ci/appveyor-cpp-setup.bat b/ci/appveyor-cpp-setup.bat index 47448ce0887..3bf01ec12dd 100644 --- a/ci/appveyor-cpp-setup.bat +++ b/ci/appveyor-cpp-setup.bat @@ -70,6 +70,12 @@ if "%JOB%" NEQ "Build_Debug" ( "fsspec" ^ "python=%PYTHON%" ^ || exit /B + + @rem On Windows, GTest is always bundled from source instead of using + @rem conda binaries, avoid any interference between the two versions. + if "%JOB%" == "Toolchain" ( + conda uninstall -n arrow -q -y -c conda-forge gtest + ) ) @rem diff --git a/ci/scripts/go_test.sh b/ci/scripts/go_test.sh index 7dd873df3e1..9b2572e1b43 100755 --- a/ci/scripts/go_test.sh +++ b/ci/scripts/go_test.sh @@ -21,10 +21,18 @@ set -ex source_dir=${1}/go +testargs="-race" +case "$(uname)" in + MINGW*) + # -race doesn't work on windows currently + testargs="" + ;; +esac + pushd ${source_dir}/arrow for d in $(go list ./... | grep -v vendor); do - go test $d + go test $testargs -tags "test" $d done popd @@ -32,7 +40,7 @@ popd pushd ${source_dir}/parquet for d in $(go list ./... | grep -v vendor); do - go test $d + go test $testargs $d done popd diff --git a/ci/scripts/python_wheel_macos_build.sh b/ci/scripts/python_wheel_macos_build.sh index 82e0339c9d0..1a52a2ad52b 100755 --- a/ci/scripts/python_wheel_macos_build.sh +++ b/ci/scripts/python_wheel_macos_build.sh @@ -53,6 +53,7 @@ export PIP_SITE_PACKAGES=$(python -c 'import site; print(site.getsitepackages()[ export PIP_TARGET_PLATFORM="macosx_${MACOSX_DEPLOYMENT_TARGET//./_}_${arch}" pip install \ + --upgrade \ --only-binary=:all: \ --target $PIP_SITE_PACKAGES \ --platform $PIP_TARGET_PLATFORM \ diff --git a/ci/scripts/r_docker_configure.sh b/ci/scripts/r_docker_configure.sh index 2b9bc03bea0..d138d030eca 100755 --- a/ci/scripts/r_docker_configure.sh +++ b/ci/scripts/r_docker_configure.sh @@ -37,7 +37,7 @@ if [ "$RHUB_PLATFORM" = "linux-x86_64-fedora-clang" ]; then dnf install -y libcxx-devel sed -i.bak -E -e 's/(CXX1?1? 
=.*)/\1 -stdlib=libc++/g' $(${R_BIN} RHOME)/etc/Makeconf rm -rf $(${R_BIN} RHOME)/etc/Makeconf.bak - + sed -i.bak -E -e 's/(CXXFLAGS = )(.*)/\1 -g -O3 -Wall -pedantic -frtti -fPIC/' $(${R_BIN} RHOME)/etc/Makeconf rm -rf $(${R_BIN} RHOME)/etc/Makeconf.bak fi @@ -75,9 +75,3 @@ fi # Workaround for html help install failure; see https://github.com/r-lib/devtools/issues/2084#issuecomment-530912786 Rscript -e 'x <- file.path(R.home("doc"), "html"); if (!file.exists(x)) {dir.create(x, recursive=TRUE); file.copy(system.file("html/R.css", package="stats"), x)}' - -if [ "`which curl`" ]; then - # We need this on R >= 4.0 - curl -L https://sourceforge.net/projects/checkbaskisms/files/2.0.0.2/checkbashisms/download > /usr/local/bin/checkbashisms - chmod 755 /usr/local/bin/checkbashisms -fi diff --git a/ci/scripts/r_windows_build.sh b/ci/scripts/r_windows_build.sh index 47120eef433..8a96b3f5e79 100755 --- a/ci/scripts/r_windows_build.sh +++ b/ci/scripts/r_windows_build.sh @@ -92,10 +92,10 @@ cp $MSYS_LIB_DIR/mingw32/lib/lib{zstd,lz4,crypto,utf8proc,re2,aws*}.a $DST_DIR/l # Do the same also for ucrt64 if [ "$RTOOLS_VERSION" != "35" ]; then -ls $MSYS_LIB_DIR/ucrt64/lib/ -mkdir -p $DST_DIR/lib/x64-ucrt -mv ucrt64/lib/*.a $DST_DIR/${RWINLIB_LIB_DIR}/x64-ucrt -cp $MSYS_LIB_DIR/ucrt64/lib/lib{zstd,lz4,crypto,utf8proc,re2,aws*}.a $DST_DIR/lib/x64-ucrt + ls $MSYS_LIB_DIR/ucrt64/lib/ + mkdir -p $DST_DIR/lib/x64-ucrt + mv ucrt64/lib/*.a $DST_DIR/lib/x64-ucrt + cp $MSYS_LIB_DIR/ucrt64/lib/lib{thrift,snappy,zstd,lz4,crypto,utf8proc,re2,aws*}.a $DST_DIR/lib/x64-ucrt fi # Create build artifact diff --git a/cpp/build-support/fuzzing/generate_corpuses.sh b/cpp/build-support/fuzzing/generate_corpuses.sh index f0d8e162375..e3f00e64782 100755 --- a/cpp/build-support/fuzzing/generate_corpuses.sh +++ b/cpp/build-support/fuzzing/generate_corpuses.sh @@ -27,15 +27,21 @@ fi set -ex CORPUS_DIR=/tmp/corpus -ARROW_CPP=$(cd $(dirname $BASH_SOURCE)/../..; pwd) +ARROW_ROOT=$(cd $(dirname $BASH_SOURCE)/../../..; pwd) +ARROW_CPP=$ARROW_ROOT/cpp OUT=$1 # NOTE: name of seed corpus output file should be "-seed_corpus.zip" # where "" is the exact name of the fuzz target executable the # seed corpus is generated for. +IPC_INTEGRATION_FILES=$(find ${ARROW_ROOT}/testing/data/arrow-ipc-stream/integration -name "*.stream") + rm -rf ${CORPUS_DIR} ${OUT}/arrow-ipc-generate-fuzz-corpus -stream ${CORPUS_DIR} +# Several IPC integration files can have the same name, make sure +# they all appear in the corpus by numbering the duplicates. 
+cp --backup=numbered ${IPC_INTEGRATION_FILES} ${CORPUS_DIR}
${ARROW_CPP}/build-support/fuzzing/pack_corpus.py ${CORPUS_DIR} ${OUT}/arrow-ipc-stream-fuzz_seed_corpus.zip
rm -rf ${CORPUS_DIR}
@@ -48,5 +54,6 @@ ${ARROW_CPP}/build-support/fuzzing/pack_corpus.py ${CORPUS_DIR} ${OUT}/arrow-ipc
rm -rf ${CORPUS_DIR}
${OUT}/parquet-arrow-generate-fuzz-corpus ${CORPUS_DIR}
+# Add Parquet testing examples
cp ${ARROW_CPP}/submodules/parquet-testing/data/*.parquet ${CORPUS_DIR}
${ARROW_CPP}/build-support/fuzzing/pack_corpus.py ${CORPUS_DIR} ${OUT}/parquet-arrow-fuzz_seed_corpus.zip
diff --git a/cpp/src/arrow/CMakeLists.txt b/cpp/src/arrow/CMakeLists.txt
index 637f3d1a54f..e06fad9a1de 100644
--- a/cpp/src/arrow/CMakeLists.txt
+++ b/cpp/src/arrow/CMakeLists.txt
@@ -190,6 +190,7 @@ set(ARROW_SRCS
   io/slow.cc
   io/stdio.cc
   io/transform.cc
+  util/async_util.cc
   util/basic_decimal.cc
   util/bit_block_counter.cc
   util/bit_run_reader.cc
diff --git a/cpp/src/arrow/adapters/orc/adapter.cc b/cpp/src/arrow/adapters/orc/adapter.cc
index 2f74b40e40d..94a3b6e882a 100644
--- a/cpp/src/arrow/adapters/orc/adapter.cc
+++ b/cpp/src/arrow/adapters/orc/adapter.cc
@@ -430,10 +430,14 @@ ORCFileReader::~ORCFileReader() {}
 Status ORCFileReader::Open(const std::shared_ptr<io::RandomAccessFile>& file,
                            MemoryPool* pool, std::unique_ptr<ORCFileReader>* reader) {
+  return Open(file, pool).Value(reader);
+}
+
+Result<std::unique_ptr<ORCFileReader>> ORCFileReader::Open(
+    const std::shared_ptr<io::RandomAccessFile>& file, MemoryPool* pool) {
   auto result = std::unique_ptr<ORCFileReader>(new ORCFileReader());
   RETURN_NOT_OK(result->impl_->Open(file, pool));
-  *reader = std::move(result);
-  return Status::OK();
+  return std::move(result);
 }
 
 Result<std::shared_ptr<const KeyValueMetadata>> ORCFileReader::ReadMetadata() {
@@ -444,33 +448,79 @@
 Status ORCFileReader::ReadSchema(std::shared_ptr<Schema>* out) {
   return impl_->ReadSchema(out);
 }
 
+Result<std::shared_ptr<Schema>> ORCFileReader::ReadSchema() {
+  std::shared_ptr<Schema> schema;
+  RETURN_NOT_OK(impl_->ReadSchema(&schema));
+  return schema;
+}
+
 Status ORCFileReader::Read(std::shared_ptr<Table>* out) { return impl_->Read(out); }
 
+Result<std::shared_ptr<Table>> ORCFileReader::Read() {
+  std::shared_ptr<Table> table;
+  RETURN_NOT_OK(impl_->Read(&table));
+  return table;
+}
+
 Status ORCFileReader::Read(const std::shared_ptr<Schema>& schema,
                            std::shared_ptr<Table>* out) {
   return impl_->Read(schema, out);
 }
 
+Result<std::shared_ptr<Table>> ORCFileReader::Read(
+    const std::shared_ptr<Schema>& schema) {
+  std::shared_ptr<Table> table;
+  RETURN_NOT_OK(impl_->Read(schema, &table));
+  return table;
+}
+
 Status ORCFileReader::Read(const std::vector<int>& include_indices,
                            std::shared_ptr<Table>* out) {
   return impl_->Read(include_indices, out);
 }
 
+Result<std::shared_ptr<Table>> ORCFileReader::Read(
+    const std::vector<int>& include_indices) {
+  std::shared_ptr<Table> table;
+  RETURN_NOT_OK(impl_->Read(include_indices, &table));
+  return table;
+}
+
 Status ORCFileReader::Read(const std::shared_ptr<Schema>& schema,
                            const std::vector<int>& include_indices,
                            std::shared_ptr<Table>* out) {
   return impl_->Read(schema, include_indices, out);
 }
 
+Result<std::shared_ptr<Table>> ORCFileReader::Read(
+    const std::shared_ptr<Schema>& schema, const std::vector<int>& include_indices) {
+  std::shared_ptr<Table> table;
+  RETURN_NOT_OK(impl_->Read(schema, include_indices, &table));
+  return table;
+}
+
 Status ORCFileReader::ReadStripe(int64_t stripe, std::shared_ptr<RecordBatch>* out) {
   return impl_->ReadStripe(stripe, out);
 }
 
+Result<std::shared_ptr<RecordBatch>> ORCFileReader::ReadStripe(int64_t stripe) {
+  std::shared_ptr<RecordBatch> recordBatch;
+  RETURN_NOT_OK(impl_->ReadStripe(stripe, &recordBatch));
+  return recordBatch;
+}
+
 Status ORCFileReader::ReadStripe(int64_t stripe, const std::vector<int>& include_indices,
                                  std::shared_ptr<RecordBatch>* out) {
   return impl_->ReadStripe(stripe, include_indices, out);
 }
 
+Result<std::shared_ptr<RecordBatch>> ORCFileReader::ReadStripe(
+    int64_t stripe, const std::vector<int>& include_indices) {
+  std::shared_ptr<RecordBatch> recordBatch;
+  RETURN_NOT_OK(impl_->ReadStripe(stripe, include_indices, &recordBatch));
+  return recordBatch;
+}
+
 Status ORCFileReader::Seek(int64_t row_number) { return impl_->Seek(row_number); }
 
 Status ORCFileReader::NextStripeReader(int64_t batch_sizes,
@@ -478,12 +528,26 @@ Status ORCFileReader::NextStripeReader(int64_t batch_sizes,
   return impl_->NextStripeReader(batch_sizes, out);
 }
 
+Result<std::shared_ptr<RecordBatchReader>> ORCFileReader::NextStripeReader(
+    int64_t batch_size) {
+  std::shared_ptr<RecordBatchReader> reader;
+  RETURN_NOT_OK(impl_->NextStripeReader(batch_size, &reader));
+  return reader;
+}
+
 Status ORCFileReader::NextStripeReader(int64_t batch_size,
                                        const std::vector<int>& include_indices,
                                        std::shared_ptr<RecordBatchReader>* out) {
   return impl_->NextStripeReader(batch_size, include_indices, out);
 }
 
+Result<std::shared_ptr<RecordBatchReader>> ORCFileReader::NextStripeReader(
+    int64_t batch_size, const std::vector<int>& include_indices) {
+  std::shared_ptr<RecordBatchReader> reader;
+  RETURN_NOT_OK(impl_->NextStripeReader(batch_size, include_indices, &reader));
+  return reader;
+}
+
 int64_t ORCFileReader::NumberOfStripes() { return impl_->NumberOfStripes(); }
 
 int64_t ORCFileReader::NumberOfRows() { return impl_->NumberOfRows(); }
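To make the new surface concrete, here is a minimal, hypothetical usage sketch (not part of the diff itself; the file path and helper name are illustrative) contrasting the Result-returning overloads added above with the deprecated Status-plus-out-parameter style they replace:

#include <memory>
#include <string>
#include "arrow/adapters/orc/adapter.h"
#include "arrow/io/file.h"
#include "arrow/memory_pool.h"
#include "arrow/result.h"
#include "arrow/status.h"
#include "arrow/table.h"

arrow::Status ReadOrcFileExample(const std::string& path) {
  ARROW_ASSIGN_OR_RAISE(auto file, arrow::io::ReadableFile::Open(path));
  // New style: the reader and the table both arrive through arrow::Result,
  // so errors propagate via ARROW_ASSIGN_OR_RAISE instead of out-parameters.
  ARROW_ASSIGN_OR_RAISE(auto reader, arrow::adapters::orc::ORCFileReader::Open(
                                         file, arrow::default_memory_pool()));
  ARROW_ASSIGN_OR_RAISE(std::shared_ptr<arrow::Table> table, reader->Read());
  // Old style, now behind ARROW_DEPRECATED and implemented as shims over the
  // Result overloads:
  //   std::unique_ptr<arrow::adapters::orc::ORCFileReader> reader;
  //   ARROW_RETURN_NOT_OK(
  //       arrow::adapters::orc::ORCFileReader::Open(file, pool, &reader));
  return arrow::Status::OK();
}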
diff --git a/cpp/src/arrow/adapters/orc/adapter.h b/cpp/src/arrow/adapters/orc/adapter.h
index 012c1701980..036795188f6 100644
--- a/cpp/src/arrow/adapters/orc/adapter.h
+++ b/cpp/src/arrow/adapters/orc/adapter.h
@@ -27,6 +27,7 @@
 #include "arrow/status.h"
 #include "arrow/type.h"
 #include "arrow/type_fwd.h"
+#include "arrow/util/macros.h"
 #include "arrow/util/visibility.h"
 
 namespace arrow {
@@ -45,9 +46,18 @@ class ARROW_EXPORT ORCFileReader {
   /// \param[in] pool a MemoryPool to use for buffer allocations
   /// \param[out] reader the returned reader object
   /// \return Status
+  ARROW_DEPRECATED("Deprecated in 6.0.0. Use Result-returning overload instead.")
   static Status Open(const std::shared_ptr<io::RandomAccessFile>& file,
                      MemoryPool* pool, std::unique_ptr<ORCFileReader>* reader);
 
+  /// \brief Creates a new ORC reader
+  ///
+  /// \param[in] file the data source
+  /// \param[in] pool a MemoryPool to use for buffer allocations
+  /// \return the returned reader object
+  static Result<std::unique_ptr<ORCFileReader>> Open(
+      const std::shared_ptr<io::RandomAccessFile>& file, MemoryPool* pool);
+
   /// \brief Return the metadata read from the ORC file
   ///
   /// \return A KeyValueMetadata object containing the ORC metadata
@@ -56,31 +66,63 @@ class ARROW_EXPORT ORCFileReader {
   /// \brief Return the schema read from the ORC file
   ///
   /// \param[out] out the returned Schema object
+  ARROW_DEPRECATED("Deprecated in 6.0.0. Use Result-returning overload instead.")
   Status ReadSchema(std::shared_ptr<Schema>* out);
 
+  /// \brief Return the schema read from the ORC file
+  ///
+  /// \return the returned Schema object
+  Result<std::shared_ptr<Schema>> ReadSchema();
+
   /// \brief Read the file as a Table
   ///
   /// The table will be composed of one record batch per stripe.
   ///
   /// \param[out] out the returned Table
+  ARROW_DEPRECATED("Deprecated in 6.0.0. Use Result-returning overload instead.")
   Status Read(std::shared_ptr<Table>* out);
 
+  /// \brief Read the file as a Table
+  ///
+  /// The table will be composed of one record batch per stripe.
+  ///
+  /// \return the returned Table
+  Result<std::shared_ptr<Table>> Read();
+
   /// \brief Read the file as a Table
   ///
   /// The table will be composed of one record batch per stripe.
   ///
   /// \param[in] schema the Table schema
   /// \param[out] out the returned Table
+  ARROW_DEPRECATED("Deprecated in 6.0.0. Use Result-returning overload instead.")
   Status Read(const std::shared_ptr<Schema>& schema, std::shared_ptr<Table>* out);
 
+  /// \brief Read the file as a Table
+  ///
+  /// The table will be composed of one record batch per stripe.
+  ///
+  /// \param[in] schema the Table schema
+  /// \return the returned Table
+  Result<std::shared_ptr<Table>> Read(const std::shared_ptr<Schema>& schema);
+
   /// \brief Read the file as a Table
   ///
   /// The table will be composed of one record batch per stripe.
   ///
   /// \param[in] include_indices the selected field indices to read
   /// \param[out] out the returned Table
+  ARROW_DEPRECATED("Deprecated in 6.0.0. Use Result-returning overload instead.")
   Status Read(const std::vector<int>& include_indices, std::shared_ptr<Table>* out);
 
+  /// \brief Read the file as a Table
+  ///
+  /// The table will be composed of one record batch per stripe.
+  ///
+  /// \param[in] include_indices the selected field indices to read
+  /// \return the returned Table
+  Result<std::shared_ptr<Table>> Read(const std::vector<int>& include_indices);
+
   /// \brief Read the file as a Table
   ///
   /// The table will be composed of one record batch per stripe.
@@ -88,23 +130,50 @@ class ARROW_EXPORT ORCFileReader {
   /// \param[in] schema the Table schema
   /// \param[in] include_indices the selected field indices to read
   /// \param[out] out the returned Table
+  ARROW_DEPRECATED("Deprecated in 6.0.0. Use Result-returning overload instead.")
   Status Read(const std::shared_ptr<Schema>& schema,
               const std::vector<int>& include_indices, std::shared_ptr<Table>* out);
 
+  /// \brief Read the file as a Table
+  ///
+  /// The table will be composed of one record batch per stripe.
+  ///
+  /// \param[in] schema the Table schema
+  /// \param[in] include_indices the selected field indices to read
+  /// \return the returned Table
+  Result<std::shared_ptr<Table>> Read(const std::shared_ptr<Schema>& schema,
+                                      const std::vector<int>& include_indices);
+
   /// \brief Read a single stripe as a RecordBatch
   ///
   /// \param[in] stripe the stripe index
   /// \param[out] out the returned RecordBatch
+  ARROW_DEPRECATED("Deprecated in 6.0.0. Use Result-returning overload instead.")
   Status ReadStripe(int64_t stripe, std::shared_ptr<RecordBatch>* out);
 
+  /// \brief Read a single stripe as a RecordBatch
+  ///
+  /// \param[in] stripe the stripe index
+  /// \return the returned RecordBatch
+  Result<std::shared_ptr<RecordBatch>> ReadStripe(int64_t stripe);
+
   /// \brief Read a single stripe as a RecordBatch
   ///
   /// \param[in] stripe the stripe index
   /// \param[in] include_indices the selected field indices to read
   /// \param[out] out the returned RecordBatch
+  ARROW_DEPRECATED("Deprecated in 6.0.0. Use Result-returning overload instead.")
   Status ReadStripe(int64_t stripe, const std::vector<int>& include_indices,
                     std::shared_ptr<RecordBatch>* out);
 
+  /// \brief Read a single stripe as a RecordBatch
+  ///
+  /// \param[in] stripe the stripe index
+  /// \param[in] include_indices the selected field indices to read
+  /// \return the returned RecordBatch
+  Result<std::shared_ptr<RecordBatch>> ReadStripe(
+      int64_t stripe, const std::vector<int>& include_indices);
+
   /// \brief Seek to designated row. Invoke NextStripeReader() after seek
   ///        will return stripe reader starting from designated row.
   ///
@@ -119,8 +188,19 @@
   /// \param[in] batch_size the number of rows each record batch contains in
   /// record batch iteration.
   /// \param[out] out the returned stripe reader
+  ARROW_DEPRECATED("Deprecated in 6.0.0. Use Result-returning overload instead.")
   Status NextStripeReader(int64_t batch_size, std::shared_ptr<RecordBatchReader>* out);
 
+  /// \brief Get a stripe level record batch iterator with specified row count
+  ///        in each record batch. NextStripeReader serves as a fine grain
+  ///        alternative to ReadStripe which may cause OOM issue by loading
+  ///        the whole stripes into memory.
+  ///
+  /// \param[in] batch_size the number of rows each record batch contains in
+  /// record batch iteration.
+  /// \return the returned stripe reader
+  Result<std::shared_ptr<RecordBatchReader>> NextStripeReader(int64_t batch_size);
+
   /// \brief Get a stripe level record batch iterator with specified row count
   ///        in each record batch. NextStripeReader serves as a fine grain
   ///        alternative to ReadStripe which may cause OOM issue by loading
   ///        the whole stripes into memory.
@@ -131,9 +211,23 @@
   ///
   /// \param[in] include_indices the selected field indices to read
   /// \param[out] out the returned stripe reader
+  ARROW_DEPRECATED("Deprecated in 6.0.0. Use Result-returning overload instead.")
   Status NextStripeReader(int64_t batch_size, const std::vector<int>& include_indices,
                           std::shared_ptr<RecordBatchReader>* out);
 
+  /// \brief Get a stripe level record batch iterator with specified row count
+  ///        in each record batch. NextStripeReader serves as a fine grain
+  ///        alternative to ReadStripe which may cause OOM issue by loading
+  ///        the whole stripes into memory.
+  ///
+  /// \param[in] batch_size the number of rows each record batch contains in
+  /// record batch iteration.
+  ///
+  /// \param[in] include_indices the selected field indices to read
+  /// \return the returned stripe reader
+  Result<std::shared_ptr<RecordBatchReader>> NextStripeReader(
+      int64_t batch_size, const std::vector<int>& include_indices);
+
   /// \brief The number of stripes in the file
   int64_t NumberOfStripes();
diff --git a/cpp/src/arrow/adapters/orc/adapter_test.cc b/cpp/src/arrow/adapters/orc/adapter_test.cc
index 9f7fb561362..39c66b90f6d 100644
--- a/cpp/src/arrow/adapters/orc/adapter_test.cc
+++ b/cpp/src/arrow/adapters/orc/adapter_test.cc
@@ -237,13 +237,12 @@ void AssertTableWriteReadEqual(const std::shared_ptr<Table>& input_table,
   ARROW_EXPECT_OK(writer->Close());
   EXPECT_OK_AND_ASSIGN(auto buffer, buffer_output_stream->Finish());
   std::shared_ptr<io::RandomAccessFile> in_stream(new io::BufferReader(buffer));
-  std::unique_ptr<adapters::orc::ORCFileReader> reader;
-  ARROW_EXPECT_OK(
-      adapters::orc::ORCFileReader::Open(in_stream, default_memory_pool(), &reader));
-  std::shared_ptr<Table>
actual_output_table; - ARROW_EXPECT_OK(reader->Read(&actual_output_table)); + EXPECT_OK_AND_ASSIGN( + auto reader, adapters::orc::ORCFileReader::Open(in_stream, default_memory_pool())); + EXPECT_OK_AND_ASSIGN(auto actual_output_table, reader->Read()); AssertTablesEqual(*expected_output_table, *actual_output_table, false, false); } + void AssertArrayWriteReadEqual(const std::shared_ptr& input_array, const std::shared_ptr& expected_output_array, const int64_t max_size = kDefaultSmallMemStreamSize) { @@ -323,9 +322,8 @@ TEST(TestAdapterRead, ReadIntAndStringFileMultipleStripes) { std::make_shared(reinterpret_cast(mem_stream.getData()), static_cast(mem_stream.getLength())))); - std::unique_ptr reader; - ASSERT_TRUE( - adapters::orc::ORCFileReader::Open(in_stream, default_memory_pool(), &reader).ok()); + ASSERT_OK_AND_ASSIGN( + auto reader, adapters::orc::ORCFileReader::Open(in_stream, default_memory_pool())); EXPECT_OK_AND_ASSIGN(auto metadata, reader->ReadMetadata()); auto expected_metadata = std::const_pointer_cast( @@ -334,8 +332,7 @@ TEST(TestAdapterRead, ReadIntAndStringFileMultipleStripes) { ASSERT_EQ(stripe_row_count * stripe_count, reader->NumberOfRows()); ASSERT_EQ(stripe_count, reader->NumberOfStripes()); accumulated = 0; - std::shared_ptr stripe_reader; - EXPECT_TRUE(reader->NextStripeReader(reader_batch_size, &stripe_reader).ok()); + EXPECT_OK_AND_ASSIGN(auto stripe_reader, reader->NextStripeReader(reader_batch_size)); while (stripe_reader) { std::shared_ptr record_batch; EXPECT_TRUE(stripe_reader->ReadNext(&record_batch).ok()); @@ -350,14 +347,14 @@ TEST(TestAdapterRead, ReadIntAndStringFileMultipleStripes) { } EXPECT_TRUE(stripe_reader->ReadNext(&record_batch).ok()); } - EXPECT_TRUE(reader->NextStripeReader(reader_batch_size, &stripe_reader).ok()); + EXPECT_OK_AND_ASSIGN(stripe_reader, reader->NextStripeReader(reader_batch_size)); } // test seek operation int64_t start_offset = 830; EXPECT_TRUE(reader->Seek(stripe_row_count + start_offset).ok()); - EXPECT_TRUE(reader->NextStripeReader(reader_batch_size, &stripe_reader).ok()); + EXPECT_OK_AND_ASSIGN(stripe_reader, reader->NextStripeReader(reader_batch_size)); std::shared_ptr record_batch; EXPECT_TRUE(stripe_reader->ReadNext(&record_batch).ok()); while (record_batch) { diff --git a/cpp/src/arrow/array/array_test.cc b/cpp/src/arrow/array/array_test.cc index cc45a369400..d9617c4e603 100644 --- a/cpp/src/arrow/array/array_test.cc +++ b/cpp/src/arrow/array/array_test.cc @@ -3214,4 +3214,73 @@ TEST(TestSwapEndianArrayData, MonthDayNanoInterval) { ASSERT_OK(swap_array->ValidateFull()); } +DataTypeVector SwappableTypes() { + return DataTypeVector{int8(), + int16(), + int32(), + int64(), + uint8(), + uint16(), + uint32(), + uint64(), + decimal128(19, 4), + decimal256(37, 8), + timestamp(TimeUnit::MICRO, ""), + time32(TimeUnit::SECOND), + time64(TimeUnit::NANO), + date32(), + date64(), + day_time_interval(), + month_interval(), + month_day_nano_interval(), + binary(), + utf8(), + large_binary(), + large_utf8(), + list(int16()), + large_list(int16()), + dictionary(int16(), utf8())}; +} + +TEST(TestSwapEndianArrayData, RandomData) { + random::RandomArrayGenerator rng(42); + + for (const auto& type : SwappableTypes()) { + ARROW_SCOPED_TRACE("type = ", type->ToString()); + auto arr = rng.ArrayOf(*field("", type), /*size=*/31); + ASSERT_OK_AND_ASSIGN(auto swapped_data, + ::arrow::internal::SwapEndianArrayData(arr->data())); + auto swapped = MakeArray(swapped_data); + ASSERT_OK_AND_ASSIGN(auto roundtripped_data, + 
::arrow::internal::SwapEndianArrayData(swapped_data)); + auto roundtripped = MakeArray(roundtripped_data); + ASSERT_OK(roundtripped->ValidateFull()); + + AssertArraysEqual(*arr, *roundtripped, /*verbose=*/true); + if (type->id() == Type::INT8 || type->id() == Type::UINT8) { + AssertArraysEqual(*arr, *swapped, /*verbose=*/true); + } else { + // Random generated data is unlikely to be made of byte-palindromes + ASSERT_FALSE(arr->Equals(*swapped)); + } + } +} + +TEST(TestSwapEndianArrayData, InvalidLength) { + // IPC-incoming data may be invalid, SwapEndianArrayData shouldn't crash + // by accessing memory out of bounds. + random::RandomArrayGenerator rng(42); + + for (const auto& type : SwappableTypes()) { + ARROW_SCOPED_TRACE("type = ", type->ToString()); + ASSERT_OK_AND_ASSIGN(auto arr, MakeArrayOfNull(type, 0)); + auto data = arr->data(); + // Fake length + data->length = 123456789; + ASSERT_OK_AND_ASSIGN(auto swapped_data, ::arrow::internal::SwapEndianArrayData(data)); + auto swapped = MakeArray(swapped_data); + ASSERT_RAISES(Invalid, swapped->Validate()); + } +} + } // namespace arrow diff --git a/cpp/src/arrow/array/util.cc b/cpp/src/arrow/array/util.cc index f12281155b8..232947d2c88 100644 --- a/cpp/src/arrow/array/util.cc +++ b/cpp/src/arrow/array/util.cc @@ -78,11 +78,16 @@ class ArrayDataWrapper { class ArrayDataEndianSwapper { public: - ArrayDataEndianSwapper(const std::shared_ptr& data, int64_t length) - : data_(data), length_(length) { + explicit ArrayDataEndianSwapper(const std::shared_ptr& data) : data_(data) { out_ = data->Copy(); } + // WARNING: this facility can be called on invalid Array data by the IPC reader. + // Do not rely on the advertised ArrayData length, instead use the physical + // buffer sizes to avoid accessing memory out of bounds. 
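+ // For instance, the primitive-buffer swapper below derives its element
+ // count as "in_buffer->size() / sizeof(T)" from the buffer's physical
+ // size instead of trusting data_->length, so a corrupted length field
+ // cannot cause an out-of-bounds read.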
+ // + // (If this guarantee turns out to be difficult to maintain, we should call + // Validate() instead) Status SwapType(const DataType& type) { RETURN_NOT_OK(VisitTypeInline(type, this)); RETURN_NOT_OK(SwapChildren(type.fields())); @@ -111,6 +116,7 @@ class ArrayDataEndianSwapper { auto in_data = reinterpret_cast(in_buffer->data()); ARROW_ASSIGN_OR_RAISE(auto out_buffer, AllocateBuffer(in_buffer->size())); auto out_data = reinterpret_cast(out_buffer->mutable_data()); + // NOTE: data_->length not trusted (see warning above) int64_t length = in_buffer->size() / sizeof(T); for (int64_t i = 0; i < length; i++) { out_data[i] = BitUtil::ByteSwap(in_data[i]); @@ -146,8 +152,8 @@ class ArrayDataEndianSwapper { auto data = reinterpret_cast(data_->buffers[1]->data()); ARROW_ASSIGN_OR_RAISE(auto new_buffer, AllocateBuffer(data_->buffers[1]->size())); auto new_data = reinterpret_cast(new_buffer->mutable_data()); - int64_t length = length_; - length = data_->buffers[1]->size() / (sizeof(uint64_t) * 2); + // NOTE: data_->length not trusted (see warning above) + const int64_t length = data_->buffers[1]->size() / Decimal128Type::kByteWidth; for (int64_t i = 0; i < length; i++) { uint64_t tmp; auto idx = i * 2; @@ -169,8 +175,8 @@ class ArrayDataEndianSwapper { auto data = reinterpret_cast(data_->buffers[1]->data()); ARROW_ASSIGN_OR_RAISE(auto new_buffer, AllocateBuffer(data_->buffers[1]->size())); auto new_data = reinterpret_cast(new_buffer->mutable_data()); - int64_t length = length_; - length = data_->buffers[1]->size() / (sizeof(uint64_t) * 4); + // NOTE: data_->length not trusted (see warning above) + const int64_t length = data_->buffers[1]->size() / Decimal256Type::kByteWidth; for (int64_t i = 0; i < length; i++) { uint64_t tmp0, tmp1, tmp2; auto idx = i * 4; @@ -206,9 +212,10 @@ class ArrayDataEndianSwapper { auto data = reinterpret_cast(data_->buffers[1]->data()); ARROW_ASSIGN_OR_RAISE(auto new_buffer, AllocateBuffer(data_->buffers[1]->size())); auto new_data = reinterpret_cast(new_buffer->mutable_data()); - int64_t length = data_->length; + // NOTE: data_->length not trusted (see warning above) + const int64_t length = data_->buffers[1]->size() / sizeof(MonthDayNanos); for (int64_t i = 0; i < length; i++) { - MonthDayNanoIntervalType::MonthDayNanos tmp = data[i]; + MonthDayNanos tmp = data[i]; #if ARROW_LITTLE_ENDIAN tmp.months = BitUtil::FromBigEndian(tmp.months); tmp.days = BitUtil::FromBigEndian(tmp.days); @@ -279,7 +286,6 @@ class ArrayDataEndianSwapper { } const std::shared_ptr& data_; - int64_t length_; std::shared_ptr out_; }; @@ -292,7 +298,7 @@ Result> SwapEndianArrayData( if (data->offset != 0) { return Status::Invalid("Unsupported data format: data.offset != 0"); } - ArrayDataEndianSwapper swapper(data, data->length); + ArrayDataEndianSwapper swapper(data); RETURN_NOT_OK(swapper.SwapType(*data->type)); return std::move(swapper.out_); } diff --git a/cpp/src/arrow/c/bridge.cc b/cpp/src/arrow/c/bridge.cc index 8b8153465ee..9484b44590a 100644 --- a/cpp/src/arrow/c/bridge.cc +++ b/cpp/src/arrow/c/bridge.cc @@ -28,6 +28,7 @@ #include "arrow/buffer.h" #include "arrow/c/helpers.h" #include "arrow/c/util_internal.h" +#include "arrow/extension_type.h" #include "arrow/memory_pool.h" #include "arrow/record_batch.h" #include "arrow/result.h" @@ -56,8 +57,6 @@ using internal::ArrayExportTraits; using internal::SchemaExportGuard; using internal::SchemaExportTraits; -// TODO export / import Extension types and arrays - namespace { Status ExportingNotImplemented(const DataType& type) { @@ -171,23 
+170,26 @@ struct SchemaExporter { export_.name_ = field.name(); flags_ = field.nullable() ? ARROW_FLAG_NULLABLE : 0; - const DataType& type = *field.type(); - RETURN_NOT_OK(ExportFormat(type)); - RETURN_NOT_OK(ExportChildren(type.fields())); + const DataType* type = UnwrapExtension(field.type().get()); + RETURN_NOT_OK(ExportFormat(*type)); + RETURN_NOT_OK(ExportChildren(type->fields())); RETURN_NOT_OK(ExportMetadata(field.metadata().get())); return Status::OK(); } - Status ExportType(const DataType& type) { + Status ExportType(const DataType& orig_type) { flags_ = ARROW_FLAG_NULLABLE; - RETURN_NOT_OK(ExportFormat(type)); - RETURN_NOT_OK(ExportChildren(type.fields())); + const DataType* type = UnwrapExtension(&orig_type); + RETURN_NOT_OK(ExportFormat(*type)); + RETURN_NOT_OK(ExportChildren(type->fields())); + // There may be additional metadata to export + RETURN_NOT_OK(ExportMetadata(nullptr)); return Status::OK(); } Status ExportSchema(const Schema& schema) { - static StructType dummy_struct_type({}); + static const StructType dummy_struct_type({}); flags_ = 0; RETURN_NOT_OK(ExportFormat(dummy_struct_type)); @@ -232,6 +234,17 @@ struct SchemaExporter { c_struct->release = ReleaseExportedSchema; } + const DataType* UnwrapExtension(const DataType* type) { + if (type->id() == Type::EXTENSION) { + const auto& ext_type = checked_cast(*type); + additional_metadata_.reserve(2); + additional_metadata_.emplace_back(kExtensionTypeKeyName, ext_type.extension_name()); + additional_metadata_.emplace_back(kExtensionMetadataKeyName, ext_type.Serialize()); + return ext_type.storage_type().get(); + } + return type; + } + Status ExportFormat(const DataType& type) { if (type.id() == Type::DICTIONARY) { const auto& dict_type = checked_cast(type); @@ -259,10 +272,29 @@ struct SchemaExporter { return Status::OK(); } - Status ExportMetadata(const KeyValueMetadata* metadata) { - if (metadata != nullptr && metadata->size() >= 0) { - ARROW_ASSIGN_OR_RAISE(export_.metadata_, EncodeMetadata(*metadata)); + Status ExportMetadata(const KeyValueMetadata* orig_metadata) { + static const KeyValueMetadata empty_metadata; + + if (orig_metadata == nullptr) { + orig_metadata = &empty_metadata; } + if (additional_metadata_.empty()) { + if (orig_metadata->size() > 0) { + ARROW_ASSIGN_OR_RAISE(export_.metadata_, EncodeMetadata(*orig_metadata)); + } + return Status::OK(); + } + // Additional metadata needs to be appended to the existing + // (for extension types) + KeyValueMetadata metadata(orig_metadata->keys(), orig_metadata->values()); + for (const auto& kv : additional_metadata_) { + // The metadata may already be there => ignore + if (metadata.Contains(kv.first)) { + continue; + } + metadata.Append(kv.first, kv.second); + } + ARROW_ASSIGN_OR_RAISE(export_.metadata_, EncodeMetadata(metadata)); return Status::OK(); } @@ -442,6 +474,7 @@ struct SchemaExporter { ExportedSchemaPrivateData export_; int64_t flags_ = 0; + std::vector> additional_metadata_; std::unique_ptr dict_exporter_; std::vector child_exporters_; }; @@ -721,7 +754,13 @@ class FormatStringParser { size_t index_; }; -Result> DecodeMetadata(const char* metadata) { +struct DecodedMetadata { + std::shared_ptr metadata; + std::string extension_name; + std::string extension_serialized; +}; + +Result DecodeMetadata(const char* metadata) { auto read_int32 = [&](int32_t* out) -> Status { int32_t v; memcpy(&v, metadata, 4); @@ -744,21 +783,29 @@ Result> DecodeMetadata(const char* metadata) { return Status::OK(); }; + DecodedMetadata decoded; + if (metadata == nullptr) { - 
return nullptr; + return decoded; } int32_t npairs; RETURN_NOT_OK(read_int32(&npairs)); if (npairs == 0) { - return nullptr; + return decoded; } std::vector keys(npairs); std::vector values(npairs); for (int32_t i = 0; i < npairs; ++i) { RETURN_NOT_OK(read_string(&keys[i])); RETURN_NOT_OK(read_string(&values[i])); + if (keys[i] == kExtensionTypeKeyName) { + decoded.extension_name = values[i]; + } else if (keys[i] == kExtensionMetadataKeyName) { + decoded.extension_serialized = values[i]; + } } - return key_value_metadata(std::move(keys), std::move(values)); + decoded.metadata = key_value_metadata(std::move(keys), std::move(values)); + return decoded; } struct SchemaImporter { @@ -775,10 +822,9 @@ struct SchemaImporter { } Result> MakeField() const { - ARROW_ASSIGN_OR_RAISE(auto metadata, DecodeMetadata(c_struct_->metadata)); const char* name = c_struct_->name ? c_struct_->name : ""; bool nullable = (c_struct_->flags & ARROW_FLAG_NULLABLE) != 0; - return field(name, type_, nullable, std::move(metadata)); + return field(name, type_, nullable, std::move(metadata_.metadata)); } Result> MakeSchema() const { @@ -787,8 +833,7 @@ struct SchemaImporter { "Cannot import schema: ArrowSchema describes non-struct type ", type_->ToString()); } - ARROW_ASSIGN_OR_RAISE(auto metadata, DecodeMetadata(c_struct_->metadata)); - return schema(type_->fields(), std::move(metadata)); + return schema(type_->fields(), std::move(metadata_.metadata)); } Result> MakeType() const { return type_; } @@ -836,6 +881,20 @@ struct SchemaImporter { bool ordered = (c_struct_->flags & ARROW_FLAG_DICTIONARY_ORDERED) != 0; type_ = dictionary(type_, dict_importer.type_, ordered); } + + // Import metadata + ARROW_ASSIGN_OR_RAISE(metadata_, DecodeMetadata(c_struct_->metadata)); + + // Detect extension type + if (!metadata_.extension_name.empty()) { + const auto registered_ext_type = GetExtensionType(metadata_.extension_name); + if (registered_ext_type) { + ARROW_ASSIGN_OR_RAISE( + type_, registered_ext_type->Deserialize(std::move(type_), + metadata_.extension_serialized)); + } + } + return Status::OK(); } @@ -1130,6 +1189,7 @@ struct SchemaImporter { int64_t recursion_level_; std::vector child_importers_; std::shared_ptr type_; + DecodedMetadata metadata_; }; } // namespace @@ -1255,8 +1315,15 @@ struct ArrayImporter { } Status DoImport() { + // Unwrap extension type + const DataType* storage_type = type_.get(); + if (storage_type->id() == Type::EXTENSION) { + storage_type = + checked_cast(*storage_type).storage_type().get(); + } + // First import children (required for reconstituting parent array data) - const auto& fields = type_->fields(); + const auto& fields = storage_type->fields(); if (c_struct_->n_children != static_cast(fields.size())) { return Status::Invalid("ArrowArray struct has ", c_struct_->n_children, " children, expected ", fields.size(), " for type ", @@ -1270,15 +1337,15 @@ struct ArrayImporter { } // Import main data - RETURN_NOT_OK(ImportMainData()); + RETURN_NOT_OK(VisitTypeInline(*storage_type, this)); - bool is_dict_type = (type_->id() == Type::DICTIONARY); + bool is_dict_type = (storage_type->id() == Type::DICTIONARY); if (c_struct_->dictionary != nullptr) { if (!is_dict_type) { return Status::Invalid("Import type is ", type_->ToString(), " but dictionary field in ArrowArray struct is not null"); } - const auto& dict_type = checked_cast(*type_); + const auto& dict_type = checked_cast(*storage_type); // Import dictionary values ArrayImporter dict_importer(dict_type.value_type()); 
RETURN_NOT_OK(dict_importer.ImportDict(this, c_struct_->dictionary)); @@ -1292,13 +1359,11 @@ struct ArrayImporter { return Status::OK(); } - Status ImportMainData() { return VisitTypeInline(*type_, this); } - Status Visit(const DataType& type) { return Status::NotImplemented("Cannot import array of type ", type_->ToString()); } - Status Visit(const FixedWidthType& type) { return ImportFixedSizePrimitive(); } + Status Visit(const FixedWidthType& type) { return ImportFixedSizePrimitive(type); } Status Visit(const NullType& type) { RETURN_NOT_OK(CheckNoChildren()); @@ -1352,16 +1417,15 @@ struct ArrayImporter { return Status::OK(); } - Status ImportFixedSizePrimitive() { - const auto& fw_type = checked_cast(*type_); + Status ImportFixedSizePrimitive(const FixedWidthType& type) { RETURN_NOT_OK(CheckNoChildren()); RETURN_NOT_OK(CheckNumBuffers(2)); RETURN_NOT_OK(AllocateArrayData()); RETURN_NOT_OK(ImportNullBitmap()); - if (BitUtil::IsMultipleOf8(fw_type.bit_width())) { - RETURN_NOT_OK(ImportFixedSizeBuffer(1, fw_type.bit_width() / 8)); + if (BitUtil::IsMultipleOf8(type.bit_width())) { + RETURN_NOT_OK(ImportFixedSizeBuffer(1, type.bit_width() / 8)); } else { - DCHECK_EQ(fw_type.bit_width(), 1); + DCHECK_EQ(type.bit_width(), 1); RETURN_NOT_OK(ImportBitsBuffer(1)); } return Status::OK(); diff --git a/cpp/src/arrow/c/bridge_test.cc b/cpp/src/arrow/c/bridge_test.cc index 54ce0efcf9d..c51cb66c03b 100644 --- a/cpp/src/arrow/c/bridge_test.cc +++ b/cpp/src/arrow/c/bridge_test.cc @@ -31,8 +31,10 @@ #include "arrow/c/util_internal.h" #include "arrow/ipc/json_simple.h" #include "arrow/memory_pool.h" +#include "arrow/testing/extension_type.h" #include "arrow/testing/gtest_util.h" #include "arrow/testing/util.h" +#include "arrow/util/checked_cast.h" #include "arrow/util/endian.h" #include "arrow/util/key_value_metadata.h" #include "arrow/util/logging.h" @@ -45,6 +47,7 @@ using internal::ArrayExportGuard; using internal::ArrayExportTraits; using internal::ArrayStreamExportGuard; using internal::ArrayStreamExportTraits; +using internal::checked_cast; using internal::SchemaExportGuard; using internal::SchemaExportTraits; @@ -122,6 +125,10 @@ using ArrayReleaseCallback = ReleaseCallback; static const std::vector kMetadataKeys1{"key1", "key2"}; static const std::vector kMetadataValues1{"", "bar"}; + +static const std::vector kMetadataKeys2{"key"}; +static const std::vector kMetadataValues2{"abcde"}; + // clang-format off static const std::string kEncodedMetadata1{ // NOLINT: runtime/string #if ARROW_LITTLE_ENDIAN @@ -133,11 +140,7 @@ static const std::string kEncodedMetadata1{ // NOLINT: runtime/string 0, 0, 0, 4, 'k', 'e', 'y', '1', 0, 0, 0, 0, 0, 0, 0, 4, 'k', 'e', 'y', '2', 0, 0, 0, 3, 'b', 'a', 'r'}; #endif -// clang-format on -static const std::vector kMetadataKeys2{"key"}; -static const std::vector kMetadataValues2{"abcde"}; -// clang-format off static const std::string kEncodedMetadata2{ // NOLINT: runtime/string #if ARROW_LITTLE_ENDIAN 1, 0, 0, 0, @@ -146,6 +149,51 @@ static const std::string kEncodedMetadata2{ // NOLINT: runtime/string 0, 0, 0, 1, 0, 0, 0, 3, 'k', 'e', 'y', 0, 0, 0, 5, 'a', 'b', 'c', 'd', 'e'}; #endif + +static const std::string kEncodedUuidMetadata = // NOLINT: runtime/string +#if ARROW_LITTLE_ENDIAN + std::string {2, 0, 0, 0} + + std::string {20, 0, 0, 0} + kExtensionTypeKeyName + + std::string {4, 0, 0, 0} + "uuid" + + std::string {24, 0, 0, 0} + kExtensionMetadataKeyName + + std::string {15, 0, 0, 0} + "uuid-serialized"; +#else + std::string {0, 0, 0, 2} + + std::string {0, 0, 0, 
20} + kExtensionTypeKeyName + + std::string {0, 0, 0, 4} + "uuid" + + std::string {0, 0, 0, 24} + kExtensionMetadataKeyName + + std::string {0, 0, 0, 15} + "uuid-serialized"; +#endif + +static const std::string kEncodedDictExtensionMetadata = // NOLINT: runtime/string +#if ARROW_LITTLE_ENDIAN + std::string {2, 0, 0, 0} + + std::string {20, 0, 0, 0} + kExtensionTypeKeyName + + std::string {14, 0, 0, 0} + "dict-extension" + + std::string {24, 0, 0, 0} + kExtensionMetadataKeyName + + std::string {25, 0, 0, 0} + "dict-extension-serialized"; +#else + std::string {0, 0, 0, 2} + + std::string {0, 0, 0, 20} + kExtensionTypeKeyName + + std::string {0, 0, 0, 14} + "dict-extension" + + std::string {0, 0, 0, 24} + kExtensionMetadataKeyName + + std::string {0, 0, 0, 25} + "dict-extension-serialized"; +#endif + +static const std::string kEncodedComplex128Metadata = // NOLINT: runtime/string +#if ARROW_LITTLE_ENDIAN + std::string {2, 0, 0, 0} + + std::string {20, 0, 0, 0} + kExtensionTypeKeyName + + std::string {10, 0, 0, 0} + "complex128" + + std::string {24, 0, 0, 0} + kExtensionMetadataKeyName + + std::string {21, 0, 0, 0} + "complex128-serialized"; +#else + std::string {0, 0, 0, 2} + + std::string {0, 0, 0, 20} + kExtensionTypeKeyName + + std::string {0, 0, 0, 10} + "complex128" + + std::string {0, 0, 0, 24} + kExtensionMetadataKeyName + + std::string {0, 0, 0, 21} + "complex128-serialized"; +#endif // clang-format on static constexpr int64_t kDefaultFlags = ARROW_FLAG_NULLABLE; @@ -404,6 +452,16 @@ TEST_F(TestSchemaExport, Dictionary) { } } +TEST_F(TestSchemaExport, Extension) { + TestPrimitive(uuid(), "w:16", "", kDefaultFlags, kEncodedUuidMetadata); + + TestNested(dict_extension_type(), {"c", "u"}, {"", ""}, {kDefaultFlags, kDefaultFlags}, + {kEncodedDictExtensionMetadata, ""}); + + TestNested(complex128(), {"+s", "g", "g"}, {"", "real", "imag"}, + {ARROW_FLAG_NULLABLE, 0, 0}, {kEncodedComplex128Metadata, "", ""}); +} + TEST_F(TestSchemaExport, ExportField) { TestPrimitive(field("thing", null()), "n", "thing", ARROW_FLAG_NULLABLE); // With nullable = false @@ -507,11 +565,9 @@ class TestArrayExport : public ::testing::Test { public: void SetUp() override { pool_ = default_memory_pool(); } - static std::function*)> JSONArrayFactory( + static std::function>()> JSONArrayFactory( std::shared_ptr type, const char* json) { - return [=](std::shared_ptr* out) -> Status { - return ::arrow::ipc::internal::json::ArrayFromJSON(type, json, out); - }; + return [=]() { return ArrayFromJSON(type, json); }; } template @@ -519,7 +575,7 @@ class TestArrayExport : public ::testing::Test { auto orig_bytes = pool_->bytes_allocated(); std::shared_ptr arr; - ASSERT_OK(factory(&arr)); + ASSERT_OK_AND_ASSIGN(arr, ToResult(factory())); const ArrayData& data = *arr->data(); // non-owning reference struct ArrowArray c_export; ASSERT_OK(ExportArray(*arr, &c_export)); @@ -562,7 +618,7 @@ class TestArrayExport : public ::testing::Test { auto orig_bytes = pool_->bytes_allocated(); std::shared_ptr arr; - ASSERT_OK(factory(&arr)); + ASSERT_OK_AND_ASSIGN(arr, ToResult(factory())); const ArrayData& data = *arr->data(); // non-owning reference struct ArrowArray c_export_temp, c_export_final; ASSERT_OK(ExportArray(*arr, &c_export_temp)); @@ -607,7 +663,7 @@ class TestArrayExport : public ::testing::Test { auto orig_bytes = pool_->bytes_allocated(); std::shared_ptr arr; - ASSERT_OK(factory(&arr)); + ASSERT_OK_AND_ASSIGN(arr, ToResult(factory())); struct ArrowArray c_export_parent, c_export_child; ASSERT_OK(ExportArray(*arr, 
&c_export_parent)); @@ -661,7 +717,7 @@ class TestArrayExport : public ::testing::Test { auto orig_bytes = pool_->bytes_allocated(); std::shared_ptr arr; - ASSERT_OK(factory(&arr)); + ASSERT_OK_AND_ASSIGN(arr, ToResult(factory())); struct ArrowArray c_export_parent; ASSERT_OK(ExportArray(*arr, &c_export_parent)); @@ -752,10 +808,7 @@ TEST_F(TestArrayExport, Primitive) { } TEST_F(TestArrayExport, PrimitiveSliced) { - auto factory = [](std::shared_ptr* out) -> Status { - *out = ArrayFromJSON(int16(), "[1, 2, null, -3]")->Slice(1, 2); - return Status::OK(); - }; + auto factory = []() { return ArrayFromJSON(int16(), "[1, 2, null, -3]")->Slice(1, 2); }; TestPrimitive(factory); } @@ -802,18 +855,17 @@ TEST_F(TestArrayExport, List) { TEST_F(TestArrayExport, ListSliced) { { - auto factory = [](std::shared_ptr* out) -> Status { - *out = ArrayFromJSON(list(int8()), "[[1, 2], [3, null], [4, 5, 6], null]") - ->Slice(1, 2); - return Status::OK(); + auto factory = []() { + return ArrayFromJSON(list(int8()), "[[1, 2], [3, null], [4, 5, 6], null]") + ->Slice(1, 2); }; TestNested(factory); } { - auto factory = [](std::shared_ptr* out) -> Status { + auto factory = []() { auto values = ArrayFromJSON(int16(), "[1, 2, 3, 4, null, 5, 6, 7, 8]")->Slice(1, 6); auto offsets = ArrayFromJSON(int32(), "[0, 2, 3, 5, 6]")->Slice(2, 4); - return ListArray::FromArrays(*offsets, *values).Value(out); + return ListArray::FromArrays(*offsets, *values); }; TestNested(factory); } @@ -847,28 +899,25 @@ TEST_F(TestArrayExport, Union) { TEST_F(TestArrayExport, Dictionary) { { - auto factory = [](std::shared_ptr* out) -> Status { + auto factory = []() { auto values = ArrayFromJSON(utf8(), R"(["foo", "bar", "quux"])"); auto indices = ArrayFromJSON(uint16(), "[0, 2, 1, null, 1]"); return DictionaryArray::FromArrays(dictionary(indices->type(), values->type()), - indices, values) - .Value(out); + indices, values); }; TestNested(factory); } { - auto factory = [](std::shared_ptr* out) -> Status { + auto factory = []() { auto values = ArrayFromJSON(list(utf8()), R"([["abc", "def"], ["efg"], []])"); auto indices = ArrayFromJSON(int32(), "[0, 2, 1, null, 1]"); return DictionaryArray::FromArrays( - dictionary(indices->type(), values->type(), /*ordered=*/true), indices, - values) - .Value(out); + dictionary(indices->type(), values->type(), /*ordered=*/true), indices, values); }; TestNested(factory); } { - auto factory = [](std::shared_ptr* out) -> Status { + auto factory = []() -> Result> { auto values = ArrayFromJSON(list(utf8()), R"([["abc", "def"], ["efg"], []])"); auto indices = ArrayFromJSON(int32(), "[0, 2, 1, null, 1]"); ARROW_ASSIGN_OR_RAISE( @@ -876,13 +925,20 @@ TEST_F(TestArrayExport, Dictionary) { DictionaryArray::FromArrays(dictionary(indices->type(), values->type()), indices, values)); auto offsets = ArrayFromJSON(int64(), "[0, 2, 5]"); - RETURN_NOT_OK(LargeListArray::FromArrays(*offsets, *dict_array).Value(out)); - return (*out)->ValidateFull(); + ARROW_ASSIGN_OR_RAISE(auto arr, LargeListArray::FromArrays(*offsets, *dict_array)); + RETURN_NOT_OK(arr->ValidateFull()); + return arr; }; TestNested(factory); } } +TEST_F(TestArrayExport, Extension) { + TestPrimitive(ExampleUuid); + TestPrimitive(ExampleSmallint); + TestPrimitive(ExampleComplex128); +} + TEST_F(TestArrayExport, MovePrimitive) { TestMovePrimitive(int8(), "[1, 2, null, -3]"); TestMovePrimitive(fixed_size_binary(3), R"(["foo", "bar", null])"); @@ -898,17 +954,16 @@ TEST_F(TestArrayExport, MoveNested) { TEST_F(TestArrayExport, MoveDictionary) { { - auto factory = 
[](std::shared_ptr* out) -> Status { + auto factory = []() { auto values = ArrayFromJSON(utf8(), R"(["foo", "bar", "quux"])"); auto indices = ArrayFromJSON(int32(), "[0, 2, 1, null, 1]"); return DictionaryArray::FromArrays(dictionary(indices->type(), values->type()), - indices, values) - .Value(out); + indices, values); }; TestMoveNested(factory); } { - auto factory = [](std::shared_ptr* out) -> Status { + auto factory = []() -> Result> { auto values = ArrayFromJSON(list(utf8()), R"([["abc", "def"], ["efg"], []])"); auto indices = ArrayFromJSON(int32(), "[0, 2, 1, null, 1]"); ARROW_ASSIGN_OR_RAISE( @@ -916,8 +971,9 @@ TEST_F(TestArrayExport, MoveDictionary) { DictionaryArray::FromArrays(dictionary(indices->type(), values->type()), indices, values)); auto offsets = ArrayFromJSON(int64(), "[0, 2, 5]"); - RETURN_NOT_OK(LargeListArray::FromArrays(*offsets, *dict_array).Value(out)); - return (*out)->ValidateFull(); + ARROW_ASSIGN_OR_RAISE(auto arr, LargeListArray::FromArrays(*offsets, *dict_array)); + RETURN_NOT_OK(arr->ValidateFull()); + return arr; }; TestMoveNested(factory); } @@ -934,7 +990,7 @@ TEST_F(TestArrayExport, MoveChild) { R"([[1, "foo"], [2, null]])", /*child_id=*/1); { - auto factory = [](std::shared_ptr* out) -> Status { + auto factory = []() -> Result> { auto values = ArrayFromJSON(list(utf8()), R"([["abc", "def"], ["efg"], []])"); auto indices = ArrayFromJSON(int32(), "[0, 2, 1, null, 1]"); ARROW_ASSIGN_OR_RAISE( @@ -942,8 +998,9 @@ TEST_F(TestArrayExport, MoveChild) { DictionaryArray::FromArrays(dictionary(indices->type(), values->type()), indices, values)); auto offsets = ArrayFromJSON(int64(), "[0, 2, 5]"); - RETURN_NOT_OK(LargeListArray::FromArrays(*offsets, *dict_array).Value(out)); - return (*out)->ValidateFull(); + ARROW_ASSIGN_OR_RAISE(auto arr, LargeListArray::FromArrays(*offsets, *dict_array)); + RETURN_NOT_OK(arr->ValidateFull()); + return arr; }; TestMoveChild(factory, /*child_id=*/0); } @@ -1400,6 +1457,32 @@ TEST_F(TestSchemaImport, Dictionary) { CheckImport(expected); } +TEST_F(TestSchemaImport, UnregisteredExtension) { + FillPrimitive("w:16"); + c_struct_.metadata = kEncodedUuidMetadata.c_str(); + auto expected = fixed_size_binary(16); + CheckImport(expected); +} + +TEST_F(TestSchemaImport, RegisteredExtension) { + { + ExtensionTypeGuard guard(uuid()); + FillPrimitive("w:16"); + c_struct_.metadata = kEncodedUuidMetadata.c_str(); + auto expected = uuid(); + CheckImport(expected); + } + { + ExtensionTypeGuard guard(dict_extension_type()); + FillPrimitive(AddChild(), "u"); + FillPrimitive("c"); + FillDictionary(); + c_struct_.metadata = kEncodedDictExtensionMetadata.c_str(); + auto expected = dict_extension_type(); + CheckImport(expected); + } +} + TEST_F(TestSchemaImport, FormatStringError) { FillPrimitive(""); CheckImportError(); @@ -1481,6 +1564,22 @@ TEST_F(TestSchemaImport, DictionaryError) { CheckImportError(); } +TEST_F(TestSchemaImport, ExtensionError) { + ExtensionTypeGuard guard(uuid()); + + // Storage type doesn't match + FillPrimitive("w:15"); + c_struct_.metadata = kEncodedUuidMetadata.c_str(); + CheckImportError(); + + // Invalid serialization + std::string bogus_metadata = kEncodedUuidMetadata; + bogus_metadata[bogus_metadata.size() - 5] += 1; + FillPrimitive("w:16"); + c_struct_.metadata = bogus_metadata.c_str(); + CheckImportError(); +} + TEST_F(TestSchemaImport, RecursionError) { FillPrimitive(AddChild(), "c", "unused"); auto c = AddChild(); @@ -2163,21 +2262,44 @@ TEST_F(TestArrayImport, DictionaryWithOffset) { FillPrimitive(3, 0, 0, 
primitive_buffers_no_nulls4); FillDictionary(); - auto dict_values = ArrayFromJSON(utf8(), R"(["", "bar", "quux"])"); - auto indices = ArrayFromJSON(int8(), "[1, 2, 0]"); - ASSERT_OK_AND_ASSIGN( - auto expected, - DictionaryArray::FromArrays(dictionary(int8(), utf8()), indices, dict_values)); + auto expected = DictArrayFromJSON(dictionary(int8(), utf8()), "[1, 2, 0]", + R"(["", "bar", "quux"])"); CheckImport(expected); FillStringLike(AddChild(), 4, 0, 0, string_buffers_no_nulls1); FillPrimitive(4, 0, 2, primitive_buffers_no_nulls4); FillDictionary(); - dict_values = ArrayFromJSON(utf8(), R"(["foo", "", "bar", "quux"])"); - indices = ArrayFromJSON(int8(), "[0, 1, 3, 0]"); - ASSERT_OK_AND_ASSIGN(expected, DictionaryArray::FromArrays(dictionary(int8(), utf8()), - indices, dict_values)); + expected = DictArrayFromJSON(dictionary(int8(), utf8()), "[0, 1, 3, 0]", + R"(["foo", "", "bar", "quux"])"); + CheckImport(expected); +} + +TEST_F(TestArrayImport, RegisteredExtension) { + ExtensionTypeGuard guard({smallint(), dict_extension_type(), complex128()}); + + // smallint + FillPrimitive(3, 0, 0, primitive_buffers_no_nulls1_16); + auto expected = + ExtensionType::WrapArray(smallint(), ArrayFromJSON(int16(), "[513, 1027, 1541]")); + CheckImport(expected); + + // dict_extension_type + FillStringLike(AddChild(), 4, 0, 0, string_buffers_no_nulls1); + FillPrimitive(6, 0, 0, primitive_buffers_no_nulls4); + FillDictionary(); + + auto storage = DictArrayFromJSON(dictionary(int8(), utf8()), "[1, 2, 0, 1, 3, 0]", + R"(["foo", "", "bar", "quux"])"); + expected = ExtensionType::WrapArray(dict_extension_type(), storage); + CheckImport(expected); + + // complex128 + FillPrimitive(AddChild(), 3, 0, /*offset=*/0, primitive_buffers_no_nulls6); + FillPrimitive(AddChild(), 3, 0, /*offset=*/3, primitive_buffers_no_nulls6); + FillStructLike(3, 0, 0, 2, buffers_no_nulls_no_data); + expected = MakeComplex128(ArrayFromJSON(float64(), "[0.0, 1.5, -2.0]"), + ArrayFromJSON(float64(), "[3.0, 4.0, 5.0]")); CheckImport(expected); } @@ -2341,8 +2463,9 @@ class TestSchemaRoundtrip : public ::testing::Test { public: void SetUp() override { pool_ = default_memory_pool(); } - template - void TestWithTypeFactory(TypeFactory&& factory) { + template + void TestWithTypeFactory(TypeFactory&& factory, + ExpectedTypeFactory&& factory_expected) { std::shared_ptr type, actual; struct ArrowSchema c_schema {}; // zeroed SchemaExportGuard schema_guard(&c_schema); @@ -2359,7 +2482,7 @@ class TestSchemaRoundtrip : public ::testing::Test { // Recreate the type ASSERT_OK_AND_ASSIGN(actual, ImportType(&c_schema)); - type = factory(); + type = factory_expected(); AssertTypeEqual(*type, *actual); type.reset(); actual.reset(); @@ -2367,6 +2490,11 @@ class TestSchemaRoundtrip : public ::testing::Test { ASSERT_EQ(pool_->bytes_allocated(), orig_bytes); } + template + void TestWithTypeFactory(TypeFactory&& factory) { + TestWithTypeFactory(factory, factory); + } + template void TestWithSchemaFactory(SchemaFactory&& factory) { std::shared_ptr schema, actual; @@ -2459,6 +2587,27 @@ TEST_F(TestSchemaRoundtrip, Dictionary) { } } +TEST_F(TestSchemaRoundtrip, UnregisteredExtension) { + TestWithTypeFactory(uuid, []() { return fixed_size_binary(16); }); + TestWithTypeFactory(dict_extension_type, []() { return dictionary(int8(), utf8()); }); + + // Inside nested type + TestWithTypeFactory([]() { return list(dict_extension_type()); }, + []() { return list(dictionary(int8(), utf8())); }); +} + +TEST_F(TestSchemaRoundtrip, RegisteredExtension) { + ExtensionTypeGuard 
guard({uuid(), dict_extension_type(), complex128()}); + TestWithTypeFactory(uuid); + TestWithTypeFactory(dict_extension_type); + TestWithTypeFactory(complex128); + + // Inside nested type + TestWithTypeFactory([]() { return list(uuid()); }); + TestWithTypeFactory([]() { return list(dict_extension_type()); }); + TestWithTypeFactory([]() { return list(complex128()); }); +} + TEST_F(TestSchemaRoundtrip, Map) { TestWithTypeFactory([&]() { return map(utf8(), int32()); }); TestWithTypeFactory([&]() { return map(list(utf8()), int32()); }); @@ -2482,28 +2631,30 @@ TEST_F(TestSchemaRoundtrip, Schema) { class TestArrayRoundtrip : public ::testing::Test { public: - using ArrayFactory = std::function*)>; + using ArrayFactory = std::function>()>; void SetUp() override { pool_ = default_memory_pool(); } static ArrayFactory JSONArrayFactory(std::shared_ptr type, const char* json) { - return [=](std::shared_ptr* out) -> Status { - return ::arrow::ipc::internal::json::ArrayFromJSON(type, json, out); - }; + return [=]() { return ArrayFromJSON(type, json); }; } static ArrayFactory SlicedArrayFactory(ArrayFactory factory) { - return [=](std::shared_ptr* out) -> Status { - std::shared_ptr arr; - RETURN_NOT_OK(factory(&arr)); + return [=]() -> Result> { + ARROW_ASSIGN_OR_RAISE(auto arr, factory()); DCHECK_GE(arr->length(), 2); - *out = arr->Slice(1, arr->length() - 2); - return Status::OK(); + return arr->Slice(1, arr->length() - 2); }; } template void TestWithArrayFactory(ArrayFactory&& factory) { + TestWithArrayFactory(factory, factory); + } + + template + void TestWithArrayFactory(ArrayFactory&& factory, + ExpectedArrayFactory&& factory_expected) { std::shared_ptr array; struct ArrowArray c_array {}; struct ArrowSchema c_schema {}; @@ -2512,7 +2663,7 @@ class TestArrayRoundtrip : public ::testing::Test { auto orig_bytes = pool_->bytes_allocated(); - ASSERT_OK(factory(&array)); + ASSERT_OK_AND_ASSIGN(array, ToResult(factory())); ASSERT_OK(ExportType(*array->type(), &c_schema)); ASSERT_OK(ExportArray(*array, &c_array)); @@ -2539,7 +2690,7 @@ class TestArrayRoundtrip : public ::testing::Test { // Check value of imported array { std::shared_ptr expected; - ASSERT_OK(factory(&expected)); + ASSERT_OK_AND_ASSIGN(expected, ToResult(factory_expected())); AssertTypeEqual(*expected->type(), *array->type()); AssertArraysEqual(*expected, *array, true); } @@ -2556,7 +2707,7 @@ class TestArrayRoundtrip : public ::testing::Test { SchemaExportGuard schema_guard(&c_schema); auto orig_bytes = pool_->bytes_allocated(); - ASSERT_OK(factory(&batch)); + ASSERT_OK_AND_ASSIGN(batch, ToResult(factory())); ASSERT_OK(ExportSchema(*batch->schema(), &c_schema)); ASSERT_OK(ExportRecordBatch(*batch, &c_array)); @@ -2579,7 +2730,7 @@ class TestArrayRoundtrip : public ::testing::Test { // Check value of imported record batch { std::shared_ptr expected; - ASSERT_OK(factory(&expected)); + ASSERT_OK_AND_ASSIGN(expected, ToResult(factory())); AssertSchemaEqual(*expected->schema(), *batch->schema()); AssertBatchesEqual(*expected, *batch); } @@ -2621,15 +2772,15 @@ TEST_F(TestArrayRoundtrip, Primitive) { } TEST_F(TestArrayRoundtrip, UnknownNullCount) { - TestWithArrayFactory([](std::shared_ptr* arr) -> Status { - *arr = ArrayFromJSON(int32(), "[0, 1, 2]"); - if ((*arr)->null_bitmap()) { + TestWithArrayFactory([]() -> Result> { + auto arr = ArrayFromJSON(int32(), "[0, 1, 2]"); + if (arr->null_bitmap()) { return Status::Invalid( "Failed precondition: " "the array shouldn't have a null bitmap."); } - (*arr)->data()->SetNullCount(kUnknownNullCount); - 
return Status::OK(); + arr->data()->SetNullCount(kUnknownNullCount); + return arr; }); } @@ -2670,30 +2821,62 @@ TEST_F(TestArrayRoundtrip, Nested) { TEST_F(TestArrayRoundtrip, Dictionary) { { - auto factory = [](std::shared_ptr* out) -> Status { + auto factory = []() { auto values = ArrayFromJSON(utf8(), R"(["foo", "bar", "quux"])"); auto indices = ArrayFromJSON(int32(), "[0, 2, 1, null, 1]"); return DictionaryArray::FromArrays(dictionary(indices->type(), values->type()), - indices, values) - .Value(out); + indices, values); }; TestWithArrayFactory(factory); TestWithArrayFactory(SlicedArrayFactory(factory)); } { - auto factory = [](std::shared_ptr* out) -> Status { + auto factory = []() { auto values = ArrayFromJSON(list(utf8()), R"([["abc", "def"], ["efg"], []])"); auto indices = ArrayFromJSON(int32(), "[0, 2, 1, null, 1]"); return DictionaryArray::FromArrays( - dictionary(indices->type(), values->type(), /*ordered=*/true), indices, - values) - .Value(out); + dictionary(indices->type(), values->type(), /*ordered=*/true), indices, values); }; TestWithArrayFactory(factory); TestWithArrayFactory(SlicedArrayFactory(factory)); } } +TEST_F(TestArrayRoundtrip, RegisteredExtension) { + ExtensionTypeGuard guard({smallint(), complex128(), dict_extension_type(), uuid()}); + + TestWithArrayFactory(ExampleSmallint); + TestWithArrayFactory(ExampleUuid); + TestWithArrayFactory(ExampleComplex128); + TestWithArrayFactory(ExampleDictExtension); + + // Nested inside outer array + auto NestedFactory = [](ArrayFactory factory) { + return [factory]() -> Result> { + ARROW_ASSIGN_OR_RAISE(auto arr, ToResult(factory())); + return FixedSizeListArray::FromArrays(arr, /*list_size=*/1); + }; + }; + TestWithArrayFactory(NestedFactory(ExampleSmallint)); + TestWithArrayFactory(NestedFactory(ExampleUuid)); + TestWithArrayFactory(NestedFactory(ExampleComplex128)); + TestWithArrayFactory(NestedFactory(ExampleDictExtension)); +} + +TEST_F(TestArrayRoundtrip, UnregisteredExtension) { + auto StorageExtractor = [](ArrayFactory factory) { + return [factory]() -> Result> { + ARROW_ASSIGN_OR_RAISE(auto arr, ToResult(factory())); + return checked_cast(*arr).storage(); + }; + }; + + TestWithArrayFactory(ExampleSmallint, StorageExtractor(ExampleSmallint)); + TestWithArrayFactory(ExampleUuid, StorageExtractor(ExampleUuid)); + TestWithArrayFactory(ExampleComplex128, StorageExtractor(ExampleComplex128)); + TestWithArrayFactory(ExampleDictExtension, StorageExtractor(ExampleDictExtension)); +} + TEST_F(TestArrayRoundtrip, RecordBatch) { auto schema = ::arrow::schema( {field("ints", int16()), field("bools", boolean(), /*nullable=*/false)}); @@ -2701,22 +2884,18 @@ TEST_F(TestArrayRoundtrip, RecordBatch) { auto arr1 = ArrayFromJSON(boolean(), "[false, true, false]"); { - auto factory = [&](std::shared_ptr* out) -> Status { - *out = RecordBatch::Make(schema, 3, {arr0, arr1}); - return Status::OK(); - }; + auto factory = [&]() { return RecordBatch::Make(schema, 3, {arr0, arr1}); }; TestWithBatchFactory(factory); } { // With schema and field metadata - auto factory = [&](std::shared_ptr* out) -> Status { + auto factory = [&]() { auto f0 = schema->field(0); auto f1 = schema->field(1); f1 = f1->WithMetadata(key_value_metadata(kMetadataKeys1, kMetadataValues1)); auto schema_with_md = ::arrow::schema({f0, f1}, key_value_metadata(kMetadataKeys2, kMetadataValues2)); - *out = RecordBatch::Make(schema_with_md, 3, {arr0, arr1}); - return Status::OK(); + return RecordBatch::Make(schema_with_md, 3, {arr0, arr1}); }; TestWithBatchFactory(factory); } 
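The bridge changes above can be exercised end to end. The following is a minimal, hypothetical sketch (not part of this diff; it borrows the test-only uuid() example type from arrow/testing/extension_type.h, and the function name is illustrative) of how a registered extension type now survives a schema roundtrip through the C data interface, while an unregistered one falls back to its storage type:

#include "arrow/c/abi.h"
#include "arrow/c/bridge.h"
#include "arrow/extension_type.h"
#include "arrow/result.h"
#include "arrow/status.h"
#include "arrow/testing/extension_type.h"  // uuid(), test-only example type
#include "arrow/util/checked_cast.h"

arrow::Status RoundtripUuidSchema() {
  // Register the example type so the importer can map the
  // ARROW:extension:name / ARROW:extension:metadata keys back to it.
  ARROW_RETURN_NOT_OK(arrow::RegisterExtensionType(
      arrow::internal::checked_pointer_cast<arrow::ExtensionType>(arrow::uuid())));
  struct ArrowSchema c_schema;
  ARROW_RETURN_NOT_OK(arrow::ExportType(*arrow::uuid(), &c_schema));
  // The exported format string is the storage type's ("w:16"); the extension
  // identity travels in the metadata appended by the exporter.
  ARROW_ASSIGN_OR_RAISE(auto imported, arrow::ImportType(&c_schema));
  // imported now equals uuid(); without the registration it would have been
  // imported as fixed_size_binary(16).
  return arrow::Status::OK();
}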
diff --git a/cpp/src/arrow/compute/api_aggregate.cc b/cpp/src/arrow/compute/api_aggregate.cc index 6d7bdfa6cf9..1216fe27d4e 100644 --- a/cpp/src/arrow/compute/api_aggregate.cc +++ b/cpp/src/arrow/compute/api_aggregate.cc @@ -85,18 +85,23 @@ static auto kScalarAggregateOptionsType = GetFunctionOptionsType(DataMember("mode", &CountOptions::mode)); -static auto kModeOptionsType = - GetFunctionOptionsType(DataMember("n", &ModeOptions::n)); +static auto kModeOptionsType = GetFunctionOptionsType( + DataMember("n", &ModeOptions::n), DataMember("skip_nulls", &ModeOptions::skip_nulls), + DataMember("min_count", &ModeOptions::min_count)); static auto kVarianceOptionsType = GetFunctionOptionsType( DataMember("ddof", &VarianceOptions::ddof), DataMember("skip_nulls", &VarianceOptions::skip_nulls), DataMember("min_count", &VarianceOptions::min_count)); static auto kQuantileOptionsType = GetFunctionOptionsType( DataMember("q", &QuantileOptions::q), - DataMember("interpolation", &QuantileOptions::interpolation)); + DataMember("interpolation", &QuantileOptions::interpolation), + DataMember("skip_nulls", &QuantileOptions::skip_nulls), + DataMember("min_count", &QuantileOptions::min_count)); static auto kTDigestOptionsType = GetFunctionOptionsType( DataMember("q", &TDigestOptions::q), DataMember("delta", &TDigestOptions::delta), - DataMember("buffer_size", &TDigestOptions::buffer_size)); + DataMember("buffer_size", &TDigestOptions::buffer_size), + DataMember("skip_nulls", &TDigestOptions::skip_nulls), + DataMember("min_count", &TDigestOptions::min_count)); static auto kIndexOptionsType = GetFunctionOptionsType(DataMember("value", &IndexOptions::value)); } // namespace @@ -112,7 +117,11 @@ CountOptions::CountOptions(CountMode mode) : FunctionOptions(internal::kCountOptionsType), mode(mode) {} constexpr char CountOptions::kTypeName[]; -ModeOptions::ModeOptions(int64_t n) : FunctionOptions(internal::kModeOptionsType), n(n) {} +ModeOptions::ModeOptions(int64_t n, bool skip_nulls, uint32_t min_count) + : FunctionOptions(internal::kModeOptionsType), + n{n}, + skip_nulls{skip_nulls}, + min_count{min_count} {} constexpr char ModeOptions::kTypeName[]; VarianceOptions::VarianceOptions(int ddof, bool skip_nulls, uint32_t min_count) @@ -122,27 +131,38 @@ VarianceOptions::VarianceOptions(int ddof, bool skip_nulls, uint32_t min_count) min_count(min_count) {} constexpr char VarianceOptions::kTypeName[]; -QuantileOptions::QuantileOptions(double q, enum Interpolation interpolation) +QuantileOptions::QuantileOptions(double q, enum Interpolation interpolation, + bool skip_nulls, uint32_t min_count) : FunctionOptions(internal::kQuantileOptionsType), q{q}, - interpolation{interpolation} {} -QuantileOptions::QuantileOptions(std::vector q, enum Interpolation interpolation) + interpolation{interpolation}, + skip_nulls{skip_nulls}, + min_count{min_count} {} +QuantileOptions::QuantileOptions(std::vector q, enum Interpolation interpolation, + bool skip_nulls, uint32_t min_count) : FunctionOptions(internal::kQuantileOptionsType), q{std::move(q)}, - interpolation{interpolation} {} + interpolation{interpolation}, + skip_nulls{skip_nulls}, + min_count{min_count} {} constexpr char QuantileOptions::kTypeName[]; -TDigestOptions::TDigestOptions(double q, uint32_t delta, uint32_t buffer_size) +TDigestOptions::TDigestOptions(double q, uint32_t delta, uint32_t buffer_size, + bool skip_nulls, uint32_t min_count) : FunctionOptions(internal::kTDigestOptionsType), q{q}, delta{delta}, - buffer_size{buffer_size} {} + buffer_size{buffer_size}, + 
skip_nulls{skip_nulls}, + min_count{min_count} {} TDigestOptions::TDigestOptions(std::vector q, uint32_t delta, - uint32_t buffer_size) + uint32_t buffer_size, bool skip_nulls, uint32_t min_count) : FunctionOptions(internal::kTDigestOptionsType), q{std::move(q)}, delta{delta}, - buffer_size{buffer_size} {} + buffer_size{buffer_size}, + skip_nulls{skip_nulls}, + min_count{min_count} {} constexpr char TDigestOptions::kTypeName[]; IndexOptions::IndexOptions(std::shared_ptr value) diff --git a/cpp/src/arrow/compute/api_aggregate.h b/cpp/src/arrow/compute/api_aggregate.h index 8c27da49765..c8df81773d4 100644 --- a/cpp/src/arrow/compute/api_aggregate.h +++ b/cpp/src/arrow/compute/api_aggregate.h @@ -82,11 +82,16 @@ class ARROW_EXPORT CountOptions : public FunctionOptions { /// By default, returns the most common value and count. class ARROW_EXPORT ModeOptions : public FunctionOptions { public: - explicit ModeOptions(int64_t n = 1); + explicit ModeOptions(int64_t n = 1, bool skip_nulls = true, uint32_t min_count = 0); constexpr static char const kTypeName[] = "ModeOptions"; static ModeOptions Defaults() { return ModeOptions{}; } int64_t n = 1; + /// If true (the default), null values are ignored. Otherwise, if any value is null, + /// emit null. + bool skip_nulls; + /// If less than this many non-null values are observed, emit null. + uint32_t min_count; }; /// \brief Control Delta Degrees of Freedom (ddof) of Variance and Stddev kernel @@ -121,10 +126,12 @@ class ARROW_EXPORT QuantileOptions : public FunctionOptions { MIDPOINT, }; - explicit QuantileOptions(double q = 0.5, enum Interpolation interpolation = LINEAR); + explicit QuantileOptions(double q = 0.5, enum Interpolation interpolation = LINEAR, + bool skip_nulls = true, uint32_t min_count = 0); explicit QuantileOptions(std::vector q, - enum Interpolation interpolation = LINEAR); + enum Interpolation interpolation = LINEAR, + bool skip_nulls = true, uint32_t min_count = 0); constexpr static char const kTypeName[] = "QuantileOptions"; static QuantileOptions Defaults() { return QuantileOptions{}; } @@ -132,6 +139,11 @@ class ARROW_EXPORT QuantileOptions : public FunctionOptions { /// quantile must be between 0 and 1 inclusive std::vector q; enum Interpolation interpolation; + /// If true (the default), null values are ignored. Otherwise, if any value is null, + /// emit null. + bool skip_nulls; + /// If less than this many non-null values are observed, emit null. + uint32_t min_count; }; /// \brief Control TDigest approximate quantile kernel behavior @@ -140,9 +152,11 @@ class ARROW_EXPORT QuantileOptions : public FunctionOptions { class ARROW_EXPORT TDigestOptions : public FunctionOptions { public: explicit TDigestOptions(double q = 0.5, uint32_t delta = 100, - uint32_t buffer_size = 500); + uint32_t buffer_size = 500, bool skip_nulls = true, + uint32_t min_count = 0); explicit TDigestOptions(std::vector q, uint32_t delta = 100, - uint32_t buffer_size = 500); + uint32_t buffer_size = 500, bool skip_nulls = true, + uint32_t min_count = 0); constexpr static char const kTypeName[] = "TDigestOptions"; static TDigestOptions Defaults() { return TDigestOptions{}; } @@ -152,6 +166,11 @@ class ARROW_EXPORT TDigestOptions : public FunctionOptions { uint32_t delta; /// input buffer size, default 500 uint32_t buffer_size; + /// If true (the default), null values are ignored. Otherwise, if any value is null, + /// emit null. + bool skip_nulls; + /// If less than this many non-null values are observed, emit null. 
+ uint32_t min_count; }; /// \brief Control Index kernel behavior diff --git a/cpp/src/arrow/compute/api_scalar.cc b/cpp/src/arrow/compute/api_scalar.cc index b7287129cbc..83aaee5f0fe 100644 --- a/cpp/src/arrow/compute/api_scalar.cc +++ b/cpp/src/arrow/compute/api_scalar.cc @@ -53,6 +53,7 @@ struct EnumTraits return ""; } }; + template <> struct EnumTraits : BasicEnumTraits return ""; } }; + template <> struct EnumTraits : BasicEnumTraits< @@ -98,6 +100,80 @@ struct EnumTraits return ""; } }; +template <> +struct EnumTraits + : BasicEnumTraits { + static std::string name() { return "AssumeTimezoneOptions::Ambiguous"; } + static std::string value_name(compute::AssumeTimezoneOptions::Ambiguous value) { + switch (value) { + case compute::AssumeTimezoneOptions::Ambiguous::AMBIGUOUS_RAISE: + return "AMBIGUOUS_RAISE"; + case compute::AssumeTimezoneOptions::Ambiguous::AMBIGUOUS_EARLIEST: + return "AMBIGUOUS_EARLIEST"; + case compute::AssumeTimezoneOptions::Ambiguous::AMBIGUOUS_LATEST: + return "AMBIGUOUS_LATEST"; + } + return ""; + } +}; +template <> +struct EnumTraits + : BasicEnumTraits { + static std::string name() { return "AssumeTimezoneOptions::Nonexistent"; } + static std::string value_name(compute::AssumeTimezoneOptions::Nonexistent value) { + switch (value) { + case compute::AssumeTimezoneOptions::Nonexistent::NONEXISTENT_RAISE: + return "NONEXISTENT_RAISE"; + case compute::AssumeTimezoneOptions::Nonexistent::NONEXISTENT_EARLIEST: + return "NONEXISTENT_EARLIEST"; + case compute::AssumeTimezoneOptions::Nonexistent::NONEXISTENT_LATEST: + return "NONEXISTENT_LATEST"; + } + return ""; + } +}; + +template <> +struct EnumTraits + : BasicEnumTraits { + static std::string name() { return "compute::RoundMode"; } + static std::string value_name(compute::RoundMode value) { + switch (value) { + case compute::RoundMode::DOWN: + return "DOWN"; + case compute::RoundMode::UP: + return "UP"; + case compute::RoundMode::TOWARDS_ZERO: + return "TOWARDS_ZERO"; + case compute::RoundMode::TOWARDS_INFINITY: + return "TOWARDS_INFINITY"; + case compute::RoundMode::HALF_DOWN: + return "HALF_DOWN"; + case compute::RoundMode::HALF_UP: + return "HALF_UP"; + case compute::RoundMode::HALF_TOWARDS_ZERO: + return "HALF_TOWARDS_ZERO"; + case compute::RoundMode::HALF_TOWARDS_INFINITY: + return "HALF_TOWARDS_INFINITY"; + case compute::RoundMode::HALF_TO_EVEN: + return "HALF_TO_EVEN"; + case compute::RoundMode::HALF_TO_ODD: + return "HALF_TO_ODD"; + } + return ""; + } +}; } // namespace internal namespace compute { @@ -115,6 +191,12 @@ static auto kArithmeticOptionsType = GetFunctionOptionsType( static auto kElementWiseAggregateOptionsType = GetFunctionOptionsType( DataMember("skip_nulls", &ElementWiseAggregateOptions::skip_nulls)); +static auto kRoundOptionsType = GetFunctionOptionsType( + DataMember("ndigits", &RoundOptions::ndigits), + DataMember("round_mode", &RoundOptions::round_mode)); +static auto kRoundToMultipleOptionsType = GetFunctionOptionsType( + DataMember("multiple", &RoundToMultipleOptions::multiple), + DataMember("round_mode", &RoundToMultipleOptions::round_mode)); static auto kJoinOptionsType = GetFunctionOptionsType( DataMember("null_handling", &JoinOptions::null_handling), DataMember("null_replacement", &JoinOptions::null_replacement)); @@ -147,6 +229,10 @@ static auto kStrptimeOptionsType = GetFunctionOptionsType( DataMember("unit", &StrptimeOptions::unit)); static auto kStrftimeOptionsType = GetFunctionOptionsType( DataMember("format", &StrftimeOptions::format)); +static auto kAssumeTimezoneOptionsType 
= GetFunctionOptionsType( + DataMember("timezone", &AssumeTimezoneOptions::timezone), + DataMember("ambiguous", &AssumeTimezoneOptions::ambiguous), + DataMember("nonexistent", &AssumeTimezoneOptions::nonexistent)); static auto kPadOptionsType = GetFunctionOptionsType( DataMember("width", &PadOptions::width), DataMember("padding", &PadOptions::padding)); static auto kTrimOptionsType = GetFunctionOptionsType( @@ -175,6 +261,30 @@ ElementWiseAggregateOptions::ElementWiseAggregateOptions(bool skip_nulls) skip_nulls(skip_nulls) {} constexpr char ElementWiseAggregateOptions::kTypeName[]; +RoundOptions::RoundOptions(int64_t ndigits, RoundMode round_mode) + : FunctionOptions(internal::kRoundOptionsType), + ndigits(ndigits), + round_mode(round_mode) { + static_assert(RoundMode::HALF_DOWN > RoundMode::DOWN && + RoundMode::HALF_DOWN > RoundMode::UP && + RoundMode::HALF_DOWN > RoundMode::TOWARDS_ZERO && + RoundMode::HALF_DOWN > RoundMode::TOWARDS_INFINITY && + RoundMode::HALF_DOWN < RoundMode::HALF_UP && + RoundMode::HALF_DOWN < RoundMode::HALF_TOWARDS_ZERO && + RoundMode::HALF_DOWN < RoundMode::HALF_TOWARDS_INFINITY && + RoundMode::HALF_DOWN < RoundMode::HALF_TO_EVEN && + RoundMode::HALF_DOWN < RoundMode::HALF_TO_ODD, + "Invalid order of round modes. Modes prefixed with HALF need to be " + "enumerated last with HALF_DOWN being the first among them."); +} +constexpr char RoundOptions::kTypeName[]; + +RoundToMultipleOptions::RoundToMultipleOptions(double multiple, RoundMode round_mode) + : FunctionOptions(internal::kRoundToMultipleOptionsType), + multiple(multiple), + round_mode(round_mode) {} +constexpr char RoundToMultipleOptions::kTypeName[]; + JoinOptions::JoinOptions(NullHandlingBehavior null_handling, std::string null_replacement) : FunctionOptions(internal::kJoinOptionsType), null_handling(null_handling), @@ -250,6 +360,15 @@ StrftimeOptions::StrftimeOptions() : StrftimeOptions(kDefaultFormat) {} constexpr char StrftimeOptions::kTypeName[]; constexpr const char* StrftimeOptions::kDefaultFormat; +AssumeTimezoneOptions::AssumeTimezoneOptions(std::string timezone, Ambiguous ambiguous, + Nonexistent nonexistent) + : FunctionOptions(internal::kAssumeTimezoneOptionsType), + timezone(std::move(timezone)), + ambiguous(ambiguous), + nonexistent(nonexistent) {} +AssumeTimezoneOptions::AssumeTimezoneOptions() : AssumeTimezoneOptions("UTC") {} +constexpr char AssumeTimezoneOptions::kTypeName[]; + PadOptions::PadOptions(int64_t width, std::string padding) : FunctionOptions(internal::kPadOptionsType), width(width), @@ -301,6 +420,8 @@ namespace internal { void RegisterScalarOptions(FunctionRegistry* registry) { DCHECK_OK(registry->AddFunctionOptionsType(kArithmeticOptionsType)); DCHECK_OK(registry->AddFunctionOptionsType(kElementWiseAggregateOptionsType)); + DCHECK_OK(registry->AddFunctionOptionsType(kRoundOptionsType)); + DCHECK_OK(registry->AddFunctionOptionsType(kRoundToMultipleOptionsType)); DCHECK_OK(registry->AddFunctionOptionsType(kJoinOptionsType)); DCHECK_OK(registry->AddFunctionOptionsType(kMatchSubstringOptionsType)); DCHECK_OK(registry->AddFunctionOptionsType(kSplitOptionsType)); @@ -311,6 +432,7 @@ void RegisterScalarOptions(FunctionRegistry* registry) { DCHECK_OK(registry->AddFunctionOptionsType(kSetLookupOptionsType)); DCHECK_OK(registry->AddFunctionOptionsType(kStrptimeOptionsType)); DCHECK_OK(registry->AddFunctionOptionsType(kStrftimeOptionsType)); + DCHECK_OK(registry->AddFunctionOptionsType(kAssumeTimezoneOptionsType)); DCHECK_OK(registry->AddFunctionOptionsType(kPadOptionsType)); 
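// The static_assert in the RoundOptions constructor above pins the RoundMode
// enumerator order. A plausible reason (an assumption; the patch does not say):
// kernels can then classify tie-breaking modes with a single comparison instead
// of enumerating every HALF_* value. Hypothetical helper, at namespace scope:
bool IsTieBreakingRoundMode(RoundMode mode) {
  // Valid only because HALF_DOWN is the first of the HALF_* enumerators,
  // which the static_assert enforces.
  return mode >= RoundMode::HALF_DOWN;
}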
DCHECK_OK(registry->AddFunctionOptionsType(kTrimOptionsType)); DCHECK_OK(registry->AddFunctionOptionsType(kSliceOptionsType)); @@ -353,6 +475,15 @@ SCALAR_ARITHMETIC_UNARY(Log10, "log10", "log10_checked") SCALAR_ARITHMETIC_UNARY(Log2, "log2", "log2_checked") SCALAR_ARITHMETIC_UNARY(Log1p, "log1p", "log1p_checked") +Result Round(const Datum& arg, RoundOptions options, ExecContext* ctx) { + return CallFunction("round", {arg}, &options, ctx); +} + +Result RoundToMultiple(const Datum& arg, RoundToMultipleOptions options, + ExecContext* ctx) { + return CallFunction("round_to_multiple", {arg}, &options, ctx); +} + #define SCALAR_ARITHMETIC_BINARY(NAME, REGISTRY_NAME, REGISTRY_CHECKED_NAME) \ Result NAME(const Datum& left, const Datum& right, ArithmeticOptions options, \ ExecContext* ctx) { \ @@ -512,6 +643,11 @@ Result DayOfWeek(const Datum& arg, DayOfWeekOptions options, ExecContext* return CallFunction("day_of_week", {arg}, &options, ctx); } +Result AssumeTimezone(const Datum& arg, AssumeTimezoneOptions options, + ExecContext* ctx) { + return CallFunction("assume_timezone", {arg}, &options, ctx); +} + Result Strftime(const Datum& arg, StrftimeOptions options, ExecContext* ctx) { return CallFunction("strftime", {arg}, &options, ctx); } diff --git a/cpp/src/arrow/compute/api_scalar.h b/cpp/src/arrow/compute/api_scalar.h index 2cbc0fde2b2..9f9a2931398 100644 --- a/cpp/src/arrow/compute/api_scalar.h +++ b/cpp/src/arrow/compute/api_scalar.h @@ -29,6 +29,7 @@ #include "arrow/result.h" #include "arrow/util/macros.h" #include "arrow/util/visibility.h" +#include "arrow/vendored/datetime.h" namespace arrow { namespace compute { @@ -49,10 +50,58 @@ class ARROW_EXPORT ElementWiseAggregateOptions : public FunctionOptions { explicit ElementWiseAggregateOptions(bool skip_nulls = true); constexpr static char const kTypeName[] = "ElementWiseAggregateOptions"; static ElementWiseAggregateOptions Defaults() { return ElementWiseAggregateOptions{}; } - bool skip_nulls; }; +/// Rounding and tie-breaking modes for round compute functions. +/// Additional details and examples are provided in compute.rst. 
+enum class RoundMode : int8_t { + /// Round to nearest integer less than or equal in magnitude (aka "floor") + DOWN, + /// Round to nearest integer greater than or equal in magnitude (aka "ceil") + UP, + /// Get the integral part without fractional digits (aka "trunc") + TOWARDS_ZERO, + /// Round negative values with DOWN rule and positive values with UP rule + TOWARDS_INFINITY, + /// Round ties with DOWN rule + HALF_DOWN, + /// Round ties with UP rule + HALF_UP, + /// Round ties with TOWARDS_ZERO rule + HALF_TOWARDS_ZERO, + /// Round ties with TOWARDS_INFINITY rule + HALF_TOWARDS_INFINITY, + /// Round ties to nearest even integer + HALF_TO_EVEN, + /// Round ties to nearest odd integer + HALF_TO_ODD, +}; + +class ARROW_EXPORT RoundOptions : public FunctionOptions { + public: + explicit RoundOptions(int64_t ndigits = 0, + RoundMode round_mode = RoundMode::HALF_TO_EVEN); + constexpr static char const kTypeName[] = "RoundOptions"; + static RoundOptions Defaults() { return RoundOptions(); } + /// Rounding precision (number of digits to round to) + int64_t ndigits; + /// Rounding and tie-breaking mode + RoundMode round_mode; +}; + +class ARROW_EXPORT RoundToMultipleOptions : public FunctionOptions { + public: + explicit RoundToMultipleOptions(double multiple = 1.0, + RoundMode round_mode = RoundMode::HALF_TO_EVEN); + constexpr static char const kTypeName[] = "RoundToMultipleOptions"; + static RoundToMultipleOptions Defaults() { return RoundToMultipleOptions(); } + /// Rounding scale (multiple to round to) + double multiple; + /// Rounding and tie-breaking mode + RoundMode round_mode; +}; + /// Options for var_args_join. class ARROW_EXPORT JoinOptions : public FunctionOptions { public: @@ -185,7 +234,7 @@ class ARROW_EXPORT StrftimeOptions : public FunctionOptions { constexpr static char const kTypeName[] = "StrftimeOptions"; - constexpr static const char* kDefaultFormat = "%Y-%m-%dT%H:%M:%SZ"; + constexpr static const char* kDefaultFormat = "%Y-%m-%dT%H:%M:%S"; /// The desired format string. std::string format; @@ -278,6 +327,40 @@ struct ARROW_EXPORT DayOfWeekOptions : public FunctionOptions { uint32_t week_start; }; +/// Used to control timestamp timezone conversion and handling ambiguous/nonexistent +/// times. +struct ARROW_EXPORT AssumeTimezoneOptions : public FunctionOptions { + public: + /// \brief How to interpret ambiguous local times that can be interpreted as + /// multiple instants (normally two) due to DST shifts. + /// + /// AMBIGUOUS_EARLIEST emits the earliest instant amongst possible interpretations. + /// AMBIGUOUS_LATEST emits the latest instant amongst possible interpretations. + enum Ambiguous { AMBIGUOUS_RAISE, AMBIGUOUS_EARLIEST, AMBIGUOUS_LATEST }; + + /// \brief How to handle local times that do not exist due to DST shifts. + /// + /// NONEXISTENT_EARLIEST emits the instant "just before" the DST shift instant + /// in the given timestamp precision (for example, for a nanoseconds precision + /// timestamp, this is one nanosecond before the DST shift instant). + /// NONEXISTENT_LATEST emits the DST shift instant. 
+ enum Nonexistent { NONEXISTENT_RAISE, NONEXISTENT_EARLIEST, NONEXISTENT_LATEST }; + + explicit AssumeTimezoneOptions(std::string timezone, + Ambiguous ambiguous = AMBIGUOUS_RAISE, + Nonexistent nonexistent = NONEXISTENT_RAISE); + AssumeTimezoneOptions(); + constexpr static char const kTypeName[] = "AssumeTimezoneOptions"; + + /// Timezone to convert timestamps from + std::string timezone; + + /// How to interpret ambiguous local times (due to DST shifts) + Ambiguous ambiguous; + /// How to interpret non-existent local times (due to DST shifts) + Nonexistent nonexistent; +}; + /// @} /// \brief Get the absolute value of a value. @@ -524,8 +607,9 @@ Result Logb(const Datum& arg, const Datum& base, ExecContext* ctx = NULLPTR); /// \brief Round to the nearest integer less than or equal in magnitude to the -/// argument. Array values can be of arbitrary length. If argument is null the -/// result will be null. +/// argument. +/// +/// If argument is null the result will be null. /// /// \param[in] arg the value to round /// \param[in] ctx the function execution context, optional @@ -534,8 +618,9 @@ ARROW_EXPORT Result Floor(const Datum& arg, ExecContext* ctx = NULLPTR); /// \brief Round to the nearest integer greater than or equal in magnitude to the -/// argument. Array values can be of arbitrary length. If argument is null the -/// result will be null. +/// argument. +/// +/// If argument is null the result will be null. /// /// \param[in] arg the value to round /// \param[in] ctx the function execution context, optional @@ -543,8 +628,9 @@ Result Floor(const Datum& arg, ExecContext* ctx = NULLPTR); ARROW_EXPORT Result Ceil(const Datum& arg, ExecContext* ctx = NULLPTR); -/// \brief Get the integral part without fractional digits. Array values can be -/// of arbitrary length. If argument is null the result will be null. +/// \brief Get the integral part without fractional digits. +/// +/// If argument is null the result will be null. /// /// \param[in] arg the value to truncate /// \param[in] ctx the function execution context, optional @@ -583,10 +669,35 @@ Result MinElementWise( /// /// \param[in] arg the value to extract sign from /// \param[in] ctx the function execution context, optional -/// \return the elementwise sign function +/// \return the element-wise sign function ARROW_EXPORT Result Sign(const Datum& arg, ExecContext* ctx = NULLPTR); +/// \brief Round a value to a given precision. +/// +/// If argument is null the result will be null. +/// +/// \param[in] arg the value to round +/// \param[in] options rounding options (rounding mode and number of digits), optional +/// \param[in] ctx the function execution context, optional +/// \return the element-wise rounded value +ARROW_EXPORT +Result Round(const Datum& arg, RoundOptions options = RoundOptions::Defaults(), + ExecContext* ctx = NULLPTR); + +/// \brief Round a value to a given multiple. +/// +/// If argument is null the result will be null. +/// +/// \param[in] arg the value to round +/// \param[in] options rounding options (rounding mode and multiple), optional +/// \param[in] ctx the function execution context, optional +/// \return the element-wise rounded value +ARROW_EXPORT +Result RoundToMultiple( + const Datum& arg, RoundToMultipleOptions options = RoundToMultipleOptions::Defaults(), + ExecContext* ctx = NULLPTR); + /// \brief Compare a numeric array with a scalar.
/// /// \param[in] left datum to compare, must be an Array @@ -1025,5 +1136,21 @@ ARROW_EXPORT Result Subsecond(const Datum& values, ExecContext* ctx = NULLPTR); ARROW_EXPORT Result Strftime(const Datum& values, StrftimeOptions options, ExecContext* ctx = NULLPTR); +/// \brief Convert timestamps without a timezone to timestamps with a timezone, +/// interpreting each local timestamp in `values` as being in the specified timezone. +/// +/// \param[in] values input to convert +/// \param[in] options for setting the source timezone and the handling of ambiguous and +/// nonexistent timestamps +/// \param[in] ctx the function execution context, optional +/// \return the resulting datum +/// +/// \since 6.0.0 +/// \note API not yet finalized +ARROW_EXPORT Result AssumeTimezone(const Datum& values, + AssumeTimezoneOptions options, + ExecContext* ctx = NULLPTR); + } // namespace compute } // namespace arrow diff --git a/cpp/src/arrow/compute/api_vector.cc b/cpp/src/arrow/compute/api_vector.cc index d4c4a915999..34ee0599c3d 100644 --- a/cpp/src/arrow/compute/api_vector.cc +++ b/cpp/src/arrow/compute/api_vector.cc @@ -111,6 +111,9 @@ static auto kSortOptionsType = GetFunctionOptionsType(DataMember("sort_keys", &SortOptions::sort_keys)); static auto kPartitionNthOptionsType = GetFunctionOptionsType( DataMember("pivot", &PartitionNthOptions::pivot)); +static auto kSelectKOptionsType = GetFunctionOptionsType( + DataMember("k", &SelectKOptions::k), + DataMember("sort_keys", &SelectKOptions::sort_keys)); } // namespace } // namespace internal @@ -140,6 +143,12 @@ PartitionNthOptions::PartitionNthOptions(int64_t pivot) : FunctionOptions(internal::kPartitionNthOptionsType), pivot(pivot) {} constexpr char PartitionNthOptions::kTypeName[]; +SelectKOptions::SelectKOptions(int64_t k, std::vector sort_keys) + : FunctionOptions(internal::kSelectKOptionsType), + k(k), + sort_keys(std::move(sort_keys)) {} +constexpr char SelectKOptions::kTypeName[]; + namespace internal { void RegisterVectorOptions(FunctionRegistry* registry) { DCHECK_OK(registry->AddFunctionOptionsType(kFilterOptionsType)); @@ -148,6 +157,7 @@ void RegisterVectorOptions(FunctionRegistry* registry) { DCHECK_OK(registry->AddFunctionOptionsType(kArraySortOptionsType)); DCHECK_OK(registry->AddFunctionOptionsType(kSortOptionsType)); DCHECK_OK(registry->AddFunctionOptionsType(kPartitionNthOptionsType)); + DCHECK_OK(registry->AddFunctionOptionsType(kSelectKOptionsType)); } } // namespace internal @@ -162,6 +172,14 @@ Result> NthToIndices(const Array& values, int64_t n, return result.make_array(); } +Result> SelectKUnstable(const Datum& datum, + const SelectKOptions& options, + ExecContext* ctx) { + ARROW_ASSIGN_OR_RAISE(Datum result, + CallFunction("select_k_unstable", {datum}, &options, ctx)); + return result.make_array(); +} + Result ReplaceWithMask(const Datum& values, const Datum& mask, const Datum& replacements, ExecContext* ctx) { return CallFunction("replace_with_mask", {values, mask, replacements}, ctx); diff --git a/cpp/src/arrow/compute/api_vector.h b/cpp/src/arrow/compute/api_vector.h index 5dc68fc5c83..a1c6f7959e1 100644 --- a/cpp/src/arrow/compute/api_vector.h +++ b/cpp/src/arrow/compute/api_vector.h @@ -120,6 +120,43 @@ class ARROW_EXPORT SortOptions : public FunctionOptions { std::vector sort_keys; }; +/// \brief Options for the select-k function +class ARROW_EXPORT SelectKOptions : public FunctionOptions { + public: + explicit SelectKOptions(int64_t k = -1, std::vector sort_keys = {}); + + constexpr static char const kTypeName[] =
"SelectKOptions"; + + static SelectKOptions Defaults() { return SelectKOptions{-1, {}}; } + + static SelectKOptions TopKDefault(int64_t k, std::vector key_names = {}) { + std::vector keys; + for (const auto& name : key_names) { + keys.emplace_back(SortKey(name, SortOrder::Descending)); + } + if (key_names.empty()) { + keys.emplace_back(SortKey("not-used", SortOrder::Descending)); + } + return SelectKOptions{k, keys}; + } + static SelectKOptions BottomKDefault(int64_t k, + std::vector key_names = {}) { + std::vector keys; + for (const auto& name : key_names) { + keys.emplace_back(SortKey(name, SortOrder::Ascending)); + } + if (key_names.empty()) { + keys.emplace_back(SortKey("not-used", SortOrder::Ascending)); + } + return SelectKOptions{k, keys}; + } + + /// The number of `k` elements to keep. + int64_t k; + /// Column key(s) to order by and how to order by these sort keys. + std::vector sort_keys; +}; + /// \brief Partitioning options for NthToIndices class ARROW_EXPORT PartitionNthOptions : public FunctionOptions { public: @@ -252,6 +289,24 @@ ARROW_EXPORT Result> NthToIndices(const Array& values, int64_t n, ExecContext* ctx = NULLPTR); +/// \brief Returns the indices that would select the first `k` elements of the array in +/// the specified order. +/// +// Perform an indirect sort of the datum, keeping only the first `k` elements. The output +// array will contain indices such that the item indicated by the k-th index will be in +// the position it would be if the datum were sorted by `options.sort_keys`. However, +// indices of null values will not be part of the output. The sort is not guaranteed to be +// stable. +/// +/// \param[in] datum datum to be partitioned +/// \param[in] options options +/// \param[in] ctx the function execution context, optional +/// \return a datum with the same schema as the input +ARROW_EXPORT +Result> SelectKUnstable(const Datum& datum, + const SelectKOptions& options, + ExecContext* ctx = NULLPTR); + /// \brief Returns the indices that would sort an array in the /// specified order. /// diff --git a/cpp/src/arrow/compute/exec/util.h b/cpp/src/arrow/compute/exec/util.h index f5c55afe0f5..63f3315f7e0 100644 --- a/cpp/src/arrow/compute/exec/util.h +++ b/cpp/src/arrow/compute/exec/util.h @@ -70,6 +70,8 @@ class TempVectorStack { top_ = 0; buffer_size_ = size; ARROW_ASSIGN_OR_RAISE(auto buffer, AllocateResizableBuffer(size, pool)); + // Ensure later operations don't accidentally read uninitialized memory. + std::memset(buffer->mutable_data(), 0xFF, size); buffer_ = std::move(buffer); return Status::OK(); } diff --git a/cpp/src/arrow/compute/function.h b/cpp/src/arrow/compute/function.h index 6434d5090f6..f08b50699a5 100644 --- a/cpp/src/arrow/compute/function.h +++ b/cpp/src/arrow/compute/function.h @@ -227,7 +227,7 @@ class ARROW_EXPORT Function { virtual Result Execute(const std::vector& args, const FunctionOptions* options, ExecContext* ctx) const; - /// \brief Returns a the default options for this function. + /// \brief Returns the default options for this function. /// /// Whatever option semantics a Function has, implementations must guarantee /// that default_options() is valid to pass to Execute as options. diff --git a/cpp/src/arrow/compute/function_test.cc b/cpp/src/arrow/compute/function_test.cc index d7ebdf3de1d..183167490b6 100644 --- a/cpp/src/arrow/compute/function_test.cc +++ b/cpp/src/arrow/compute/function_test.cc @@ -15,17 +15,18 @@ // specific language governing permissions and limitations // under the License. 
+#include "arrow/compute/function.h" + +#include + #include #include #include -#include - #include "arrow/compute/api_aggregate.h" #include "arrow/compute/api_scalar.h" #include "arrow/compute/api_vector.h" #include "arrow/compute/cast.h" -#include "arrow/compute/function.h" #include "arrow/compute/kernel.h" #include "arrow/datum.h" #include "arrow/status.h" @@ -57,6 +58,12 @@ TEST(FunctionOptions, Equality) { options.emplace_back(new IndexOptions(ScalarFromJSON(boolean(), "null"))); options.emplace_back(new ArithmeticOptions()); options.emplace_back(new ArithmeticOptions(/*check_overflow=*/true)); + options.emplace_back(new RoundOptions()); + options.emplace_back( + new RoundOptions(/*ndigits=*/2, /*round_mode=*/RoundMode::TOWARDS_INFINITY)); + options.emplace_back(new RoundToMultipleOptions()); + options.emplace_back(new RoundToMultipleOptions( + /*multiple=*/100, /*round_mode=*/RoundMode::TOWARDS_INFINITY)); options.emplace_back(new ElementWiseAggregateOptions()); options.emplace_back(new ElementWiseAggregateOptions(/*skip_nulls=*/false)); options.emplace_back(new JoinOptions()); @@ -80,6 +87,11 @@ TEST(FunctionOptions, Equality) { options.emplace_back(new StrptimeOptions("%Y", TimeUnit::type::MILLI)); options.emplace_back(new StrptimeOptions("%Y", TimeUnit::type::NANO)); options.emplace_back(new StrftimeOptions("%Y-%m-%dT%H:%M:%SZ", "C")); +#ifndef _WIN32 + options.emplace_back(new AssumeTimezoneOptions( + "Europe/Amsterdam", AssumeTimezoneOptions::Ambiguous::AMBIGUOUS_RAISE, + AssumeTimezoneOptions::Nonexistent::NONEXISTENT_RAISE)); +#endif options.emplace_back(new PadOptions(5, " ")); options.emplace_back(new PadOptions(10, "A")); options.emplace_back(new TrimOptions(" ")); @@ -110,6 +122,8 @@ TEST(FunctionOptions, Equality) { {SortKey("key", SortOrder::Descending), SortKey("value", SortOrder::Descending)})); options.emplace_back(new PartitionNthOptions(/*pivot=*/0)); options.emplace_back(new PartitionNthOptions(/*pivot=*/42)); + options.emplace_back(new SelectKOptions(0, {})); + options.emplace_back(new SelectKOptions(5, {{SortKey("key", SortOrder::Ascending)}})); for (size_t i = 0; i < options.size(); i++) { const size_t prev_i = i == 0 ? options.size() - 1 : i - 1; diff --git a/cpp/src/arrow/compute/kernel.h b/cpp/src/arrow/compute/kernel.h index 099bd95bbf2..01750d1f359 100644 --- a/cpp/src/arrow/compute/kernel.h +++ b/cpp/src/arrow/compute/kernel.h @@ -290,9 +290,11 @@ class ARROW_EXPORT OutputType { enum ResolveKind { FIXED, COMPUTED }; /// Type resolution function. Given input types and shapes, return output - /// type and shape. This function SHOULD _not_ be used to check for arity, - /// that is to be performed one or more layers above. May make use of kernel - /// state to know what type to output in some cases. + /// type and shape. This function MAY may use the kernel state to decide + /// the output type based on the functionoptions. + /// + /// This function SHOULD _not_ be used to check for arity, that is to be + /// performed one or more layers above. 
using Resolver = std::function(KernelContext*, const std::vector&)>; @@ -304,7 +306,8 @@ class ARROW_EXPORT OutputType { /// \brief Output the exact type and shape provided by a ValueDescr OutputType(ValueDescr descr); // NOLINT implicit construction - explicit OutputType(Resolver resolver) + /// \brief Output a computed type depending on actual input types + OutputType(Resolver resolver) // NOLINT implicit construction : kind_(COMPUTED), resolver_(std::move(resolver)) {} OutputType(const OutputType& other) { diff --git a/cpp/src/arrow/compute/kernels/CMakeLists.txt b/cpp/src/arrow/compute/kernels/CMakeLists.txt index 4096e497c0a..ce7a85f1557 100644 --- a/cpp/src/arrow/compute/kernels/CMakeLists.txt +++ b/cpp/src/arrow/compute/kernels/CMakeLists.txt @@ -50,11 +50,13 @@ add_arrow_compute_test(vector_test vector_replace_test.cc vector_selection_test.cc vector_sort_test.cc + select_k_test.cc test_util.cc) add_arrow_benchmark(vector_hash_benchmark PREFIX "arrow-compute") add_arrow_benchmark(vector_sort_benchmark PREFIX "arrow-compute") add_arrow_benchmark(vector_partition_benchmark PREFIX "arrow-compute") +add_arrow_benchmark(vector_topk_benchmark PREFIX "arrow-compute") add_arrow_benchmark(vector_replace_benchmark PREFIX "arrow-compute") add_arrow_benchmark(vector_selection_benchmark PREFIX "arrow-compute") diff --git a/cpp/src/arrow/compute/kernels/aggregate_basic.cc b/cpp/src/arrow/compute/kernels/aggregate_basic.cc index 2952eade96b..b19536d33ab 100644 --- a/cpp/src/arrow/compute/kernels/aggregate_basic.cc +++ b/cpp/src/arrow/compute/kernels/aggregate_basic.cc @@ -549,6 +549,9 @@ struct IndexInit { static Result> Init(KernelContext* ctx, const KernelInitArgs& args) { + if (!args.options) { + return Status::Invalid("Must provide IndexOptions for index kernel"); + } IndexInit visitor(ctx, static_cast(*args.options), *args.inputs[0].type); return visitor.Create(); diff --git a/cpp/src/arrow/compute/kernels/aggregate_mode.cc b/cpp/src/arrow/compute/kernels/aggregate_mode.cc index 6ad0eeb6456..f225f6bf569 100644 --- a/cpp/src/arrow/compute/kernels/aggregate_mode.cc +++ b/cpp/src/arrow/compute/kernels/aggregate_mode.cc @@ -130,6 +130,13 @@ struct CountModer { Status Exec(KernelContext* ctx, const ExecBatch& batch, Datum* out) { // count values in all chunks, ignore nulls const Datum& datum = batch[0]; + + const ModeOptions& options = ModeState::Get(ctx); + if ((!options.skip_nulls && datum.null_count() > 0) || + (datum.length() - datum.null_count() < options.min_count)) { + return PrepareOutput(/*n=*/0, ctx, out).status(); + } + CountValues(this->counts.data(), datum, this->min); // generator to emit next value:count pair @@ -154,9 +161,16 @@ struct CountModer { template <> struct CountModer { Status Exec(KernelContext* ctx, const ExecBatch& batch, Datum* out) { + const Datum& datum = batch[0]; + + const ModeOptions& options = ModeState::Get(ctx); + if ((!options.skip_nulls && datum.null_count() > 0) || + (datum.length() - datum.null_count() < options.min_count)) { + return PrepareOutput(/*n=*/0, ctx, out).status(); + } + int64_t counts[2]{}; - const Datum& datum = batch[0]; for (const auto& array : datum.chunks()) { if (array->length() > array->null_count()) { const int64_t true_count = @@ -167,7 +181,6 @@ struct CountModer { } } - const ModeOptions& options = ModeState::Get(ctx); const int64_t distinct_values = (counts[0] != 0) + (counts[1] != 0); const int64_t n = std::min(options.n, distinct_values); @@ -198,12 +211,19 @@ struct SortModer { using Allocator = arrow::stl::allocator; Status 
Exec(KernelContext* ctx, const ExecBatch& batch, Datum* out) { + const Datum& datum = batch[0]; + const int64_t in_length = datum.length() - datum.null_count(); + + const ModeOptions& options = ModeState::Get(ctx); + if ((!options.skip_nulls && datum.null_count() > 0) || + (in_length < options.min_count)) { + return PrepareOutput(/*n=*/0, ctx, out).status(); + } + // copy all chunks to a buffer, ignore nulls and nans std::vector in_buffer(Allocator(ctx->memory_pool())); uint64_t nan_count = 0; - const Datum& datum = batch[0]; - const int64_t in_length = datum.length() - datum.null_count(); if (in_length > 0) { in_buffer.resize(in_length); CopyNonNullValues(datum, in_buffer.data()); @@ -305,6 +325,13 @@ struct Moder::value>> { template Status ScalarMode(KernelContext* ctx, const Scalar& scalar, Datum* out) { using CType = typename T::c_type; + + const ModeOptions& options = ModeState::Get(ctx); + if ((!options.skip_nulls && !scalar.is_valid) || + (static_cast(scalar.is_valid) < options.min_count)) { + return PrepareOutput(/*n=*/0, ctx, out).status(); + } + if (scalar.is_valid) { bool called = false; return Finalize(ctx, out, [&]() { diff --git a/cpp/src/arrow/compute/kernels/aggregate_quantile.cc b/cpp/src/arrow/compute/kernels/aggregate_quantile.cc index 7d2ffe0770c..bfd97f813e5 100644 --- a/cpp/src/arrow/compute/kernels/aggregate_quantile.cc +++ b/cpp/src/arrow/compute/kernels/aggregate_quantile.cc @@ -79,12 +79,18 @@ struct SortQuantiler { Status Exec(KernelContext* ctx, const ExecBatch& batch, Datum* out) { const QuantileOptions& options = QuantileState::Get(ctx); + const Datum& datum = batch[0]; // copy all chunks to a buffer, ignore nulls and nans std::vector in_buffer(Allocator(ctx->memory_pool())); + int64_t in_length = 0; + if ((!options.skip_nulls && datum.null_count() > 0) || + (datum.length() - datum.null_count() < options.min_count)) { + in_length = 0; + } else { + in_length = datum.length() - datum.null_count(); + } - const Datum& datum = batch[0]; - const int64_t in_length = datum.length() - datum.null_count(); if (in_length > 0) { in_buffer.resize(in_length); CopyNonNullValues(datum, in_buffer.data()); @@ -232,7 +238,11 @@ struct CountQuantiler { // count values in all chunks, ignore nulls const Datum& datum = batch[0]; - int64_t in_length = CountValues(this->counts.data(), datum, this->min); + int64_t in_length = 0; + if ((options.skip_nulls || (!options.skip_nulls && datum.null_count() == 0)) && + (datum.length() - datum.null_count() >= options.min_count)) { + in_length = CountValues(this->counts.data(), datum, this->min); + } // prepare out array int64_t out_length = options.q.size(); @@ -394,7 +404,7 @@ Status ScalarQuantile(KernelContext* ctx, const QuantileOptions& options, const Scalar& scalar, Datum* out) { using CType = typename T::c_type; ArrayData* output = out->mutable_array(); - if (!scalar.is_valid) { + if (!scalar.is_valid || options.min_count > 1) { output->length = 0; output->null_count = 0; return Status::OK(); diff --git a/cpp/src/arrow/compute/kernels/aggregate_tdigest.cc b/cpp/src/arrow/compute/kernels/aggregate_tdigest.cc index be8d66c4c24..3b616c664a9 100644 --- a/cpp/src/arrow/compute/kernels/aggregate_tdigest.cc +++ b/cpp/src/arrow/compute/kernels/aggregate_tdigest.cc @@ -37,14 +37,23 @@ struct TDigestImpl : public ScalarAggregator { using CType = typename ArrowType::c_type; explicit TDigestImpl(const TDigestOptions& options) - : q{options.q}, tdigest{options.delta, options.buffer_size} {} + : options{options}, + tdigest{options.delta, 
options.buffer_size}, + count{0}, + all_valid{true} {} Status Consume(KernelContext*, const ExecBatch& batch) override { + if (!this->all_valid) return Status::OK(); + if (!options.skip_nulls && batch[0].null_count() > 0) { + this->all_valid = false; + return Status::OK(); + } if (batch[0].is_array()) { const ArrayData& data = *batch[0].array(); const CType* values = data.GetValues(1); if (data.length > data.GetNullCount()) { + this->count += data.length - data.GetNullCount(); VisitSetBitRunsVoid(data.buffers[0], data.offset, data.length, [&](int64_t pos, int64_t len) { for (int64_t i = 0; i < len; ++i) { @@ -55,6 +64,7 @@ struct TDigestImpl : public ScalarAggregator { } else { const CType value = UnboxScalar::Unbox(*batch[0].scalar()); if (batch[0].scalar()->is_valid) { + this->count += 1; for (int64_t i = 0; i < batch.length; i++) { this->tdigest.NanAdd(value); } @@ -64,13 +74,21 @@ struct TDigestImpl : public ScalarAggregator { } Status MergeFrom(KernelContext*, KernelState&& src) override { - auto& other = checked_cast(src); + const auto& other = checked_cast(src); + if (!this->all_valid || !other.all_valid) { + this->all_valid = false; + return Status::OK(); + } this->tdigest.Merge(other.tdigest); + this->count += other.count; return Status::OK(); } Status Finalize(KernelContext* ctx, Datum* out) override { - const int64_t out_length = this->tdigest.is_empty() ? 0 : this->q.size(); + const int64_t out_length = + (this->tdigest.is_empty() || !this->all_valid || this->count < options.min_count) + ? 0 + : options.q.size(); auto out_data = ArrayData::Make(float64(), out_length, 0); out_data->buffers.resize(2, nullptr); @@ -79,7 +97,7 @@ struct TDigestImpl : public ScalarAggregator { ctx->Allocate(out_length * sizeof(double))); double* out_buffer = out_data->template GetMutableValues(1); for (int64_t i = 0; i < out_length; ++i) { - out_buffer[i] = this->tdigest.Quantile(this->q[i]); + out_buffer[i] = this->tdigest.Quantile(this->options.q[i]); } } @@ -87,8 +105,10 @@ struct TDigestImpl : public ScalarAggregator { return Status::OK(); } - const std::vector q; + const TDigestOptions options; TDigest tdigest; + int64_t count; + bool all_valid; }; struct TDigestInitState { diff --git a/cpp/src/arrow/compute/kernels/aggregate_test.cc b/cpp/src/arrow/compute/kernels/aggregate_test.cc index eb73e703b6e..fcf48e25a92 100644 --- a/cpp/src/arrow/compute/kernels/aggregate_test.cc +++ b/cpp/src/arrow/compute/kernels/aggregate_test.cc @@ -1853,6 +1853,10 @@ TYPED_TEST(TestNumericIndexKernel, Basics) { this->AssertIndexIs(chunked_input2, value, 4); this->AssertIndexIs(chunked_input3, value, -1); this->AssertIndexIs(chunked_input4, value, 5); + + EXPECT_RAISES_WITH_MESSAGE_THAT( + Invalid, ::testing::HasSubstr("Must provide IndexOptions"), + CallFunction("index", {ArrayFromJSON(this->type_singleton(), "[0]")})); } TYPED_TEST(TestNumericIndexKernel, Random) { constexpr auto kChunks = 4; @@ -1954,10 +1958,10 @@ class TestPrimitiveModeKernel : public ::testing::Test { using Traits = TypeTraits; using CType = typename ArrowType::c_type; - void AssertModesAre(const Datum& array, const int n, + void AssertModesAre(const Datum& array, const ModeOptions options, const std::vector& expected_modes, const std::vector& expected_counts) { - ASSERT_OK_AND_ASSIGN(Datum out, Mode(array, ModeOptions{n})); + ASSERT_OK_AND_ASSIGN(Datum out, Mode(array, options)); ValidateOutput(out); const StructArray out_array(out.array()); ASSERT_EQ(out_array.length(), expected_modes.size()); @@ -1978,11 +1982,18 @@ class 
TestPrimitiveModeKernel : public ::testing::Test { const std::vector& expected_modes, const std::vector& expected_counts) { auto array = ArrayFromJSON(type_singleton(), json); - AssertModesAre(array, n, expected_modes, expected_counts); + AssertModesAre(array, ModeOptions(n), expected_modes, expected_counts); + } + + void AssertModesAre(const std::string& json, const ModeOptions options, + const std::vector& expected_modes, + const std::vector& expected_counts) { + auto array = ArrayFromJSON(type_singleton(), json); + AssertModesAre(array, options, expected_modes, expected_counts); } void AssertModeIs(const Datum& array, CType expected_mode, int64_t expected_count) { - AssertModesAre(array, 1, {expected_mode}, {expected_count}); + AssertModesAre(array, ModeOptions(1), {expected_mode}, {expected_count}); } void AssertModeIs(const std::string& json, CType expected_mode, @@ -1997,8 +2008,8 @@ class TestPrimitiveModeKernel : public ::testing::Test { AssertModeIs(chunked, expected_mode, expected_count); } - void AssertModesEmpty(const Datum& array, int n) { - ASSERT_OK_AND_ASSIGN(Datum out, Mode(array, ModeOptions{n})); + void AssertModesEmpty(const Datum& array, ModeOptions options) { + ASSERT_OK_AND_ASSIGN(Datum out, Mode(array, options)); auto out_array = out.make_array(); ValidateOutput(*out_array); ASSERT_EQ(out.array()->length, 0); @@ -2006,12 +2017,17 @@ class TestPrimitiveModeKernel : public ::testing::Test { void AssertModesEmpty(const std::string& json, int n = 1) { auto array = ArrayFromJSON(type_singleton(), json); - AssertModesEmpty(array, n); + AssertModesEmpty(array, ModeOptions(n)); } void AssertModesEmpty(const std::vector& json, int n = 1) { auto chunked = ChunkedArrayFromJSON(type_singleton(), json); - AssertModesEmpty(chunked, n); + AssertModesEmpty(chunked, ModeOptions(n)); + } + + void AssertModesEmpty(const std::string& json, ModeOptions options) { + auto array = ArrayFromJSON(type_singleton(), json); + AssertModesEmpty(array, options); } std::shared_ptr type_singleton() { return Traits::type_singleton(); } @@ -2049,13 +2065,37 @@ TEST_F(TestBooleanModeKernel, Basics) { {true, false}, {3, 2}); this->AssertModesEmpty({"[null, null]", "[]", "[null]"}, 4); - auto ty = struct_({field("mode", boolean()), field("count", int64())}); - Datum mode_true = ArrayFromJSON(ty, "[[true, 1]]"); - Datum mode_false = ArrayFromJSON(ty, "[[false, 1]]"); - Datum mode_empty = ArrayFromJSON(ty, "[]"); - EXPECT_THAT(Mode(Datum(true)), ResultWith(mode_true)); - EXPECT_THAT(Mode(Datum(false)), ResultWith(mode_false)); - EXPECT_THAT(Mode(MakeNullScalar(boolean())), ResultWith(mode_empty)); + auto in_ty = boolean(); + this->AssertModesAre("[true, false, false, null]", ModeOptions(/*n=*/1), {false}, {2}); + this->AssertModesEmpty("[true, false, false, null]", + ModeOptions(/*n=*/1, /*skip_nulls=*/false)); + this->AssertModesAre("[true, false, false, null]", + ModeOptions(/*n=*/1, /*skip_nulls=*/true, /*min_count=*/3), + {false}, {2}); + this->AssertModesEmpty("[false, false, null]", + ModeOptions(/*n=*/1, /*skip_nulls=*/true, /*min_count=*/3)); + this->AssertModesAre("[true, false, false]", + ModeOptions(/*n=*/1, /*skip_nulls=*/false, /*min_count=*/3), + {false}, {2}); + this->AssertModesEmpty("[true, false, false, null]", + ModeOptions(/*n=*/1, /*skip_nulls=*/false, /*min_count=*/3)); + this->AssertModesEmpty("[true, false]", + ModeOptions(/*n=*/1, /*skip_nulls=*/false, /*min_count=*/3)); + this->AssertModesAre(ScalarFromJSON(in_ty, "true"), + ModeOptions(/*n=*/1, /*skip_nulls=*/false), {true}, 
{1}); + this->AssertModesEmpty(ScalarFromJSON(in_ty, "null"), + ModeOptions(/*n=*/1, /*skip_nulls=*/false)); + this->AssertModesEmpty(ScalarFromJSON(in_ty, "true"), + ModeOptions(/*n=*/1, /*skip_nulls=*/true, /*min_count=*/2)); + this->AssertModesEmpty(ScalarFromJSON(in_ty, "null"), + ModeOptions(/*n=*/1, /*skip_nulls=*/true, /*min_count=*/2)); + this->AssertModesEmpty(ScalarFromJSON(in_ty, "true"), + ModeOptions(/*n=*/1, /*skip_nulls=*/false, /*min_count=*/2)); + this->AssertModesEmpty(ScalarFromJSON(in_ty, "null"), + ModeOptions(/*n=*/1, /*skip_nulls=*/false, /*min_count=*/2)); + + this->AssertModesAre(ScalarFromJSON(in_ty, "true"), ModeOptions(/*n=*/1), {true}, {1}); + this->AssertModesEmpty(ScalarFromJSON(in_ty, "null"), ModeOptions(/*n=*/1)); } TYPED_TEST_SUITE(TestIntegerModeKernel, IntegralArrowTypes); @@ -2077,10 +2117,35 @@ TYPED_TEST(TestIntegerModeKernel, Basics) { this->AssertModesEmpty("[null, null, null]", 10); auto in_ty = this->type_singleton(); - auto ty = struct_({field("mode", in_ty), field("count", int64())}); - EXPECT_THAT(Mode(*MakeScalar(in_ty, 5)), - ResultWith(Datum(ArrayFromJSON(ty, "[[5, 1]]")))); - EXPECT_THAT(Mode(MakeNullScalar(in_ty)), ResultWith(Datum(ArrayFromJSON(ty, "[]")))); + + this->AssertModesAre("[1, 2, 2, null]", ModeOptions(/*n=*/1), {2}, {2}); + this->AssertModesEmpty("[1, 2, 2, null]", ModeOptions(/*n=*/1, /*skip_nulls=*/false)); + this->AssertModesAre("[1, 2, 2, null]", + ModeOptions(/*n=*/1, /*skip_nulls=*/true, /*min_count=*/3), {2}, + {2}); + this->AssertModesEmpty("[2, 2, null]", + ModeOptions(/*n=*/1, /*skip_nulls=*/true, /*min_count=*/3)); + this->AssertModesAre( + "[1, 2, 2]", ModeOptions(/*n=*/1, /*skip_nulls=*/false, /*min_count=*/3), {2}, {2}); + this->AssertModesEmpty("[1, 2, 2, null]", + ModeOptions(/*n=*/1, /*skip_nulls=*/false, /*min_count=*/3)); + this->AssertModesEmpty("[1, 2]", + ModeOptions(/*n=*/1, /*skip_nulls=*/false, /*min_count=*/3)); + this->AssertModesAre(ScalarFromJSON(in_ty, "1"), + ModeOptions(/*n=*/1, /*skip_nulls=*/false), {1}, {1}); + this->AssertModesEmpty(ScalarFromJSON(in_ty, "null"), + ModeOptions(/*n=*/1, /*skip_nulls=*/false)); + this->AssertModesEmpty(ScalarFromJSON(in_ty, "1"), + ModeOptions(/*n=*/1, /*skip_nulls=*/true, /*min_count=*/2)); + this->AssertModesEmpty(ScalarFromJSON(in_ty, "null"), + ModeOptions(/*n=*/1, /*skip_nulls=*/true, /*min_count=*/2)); + this->AssertModesEmpty(ScalarFromJSON(in_ty, "1"), + ModeOptions(/*n=*/1, /*skip_nulls=*/false, /*min_count=*/2)); + this->AssertModesEmpty(ScalarFromJSON(in_ty, "null"), + ModeOptions(/*n=*/1, /*skip_nulls=*/false, /*min_count=*/2)); + + this->AssertModesAre(ScalarFromJSON(in_ty, "5"), ModeOptions(/*n=*/1), {5}, {1}); + this->AssertModesEmpty(ScalarFromJSON(in_ty, "null"), ModeOptions(/*n=*/1)); } TYPED_TEST_SUITE(TestFloatingModeKernel, RealArrowTypes); @@ -2108,10 +2173,35 @@ TYPED_TEST(TestFloatingModeKernel, Floats) { this->AssertModesAre("[NaN, NaN, 1, null, 1, 2, 2]", 3, {1, 2, NAN}, {2, 2, 2}); auto in_ty = this->type_singleton(); - auto ty = struct_({field("mode", in_ty), field("count", int64())}); - EXPECT_THAT(Mode(*MakeScalar(in_ty, 5.0)), - ResultWith(Datum(ArrayFromJSON(ty, "[[5.0, 1]]")))); - EXPECT_THAT(Mode(MakeNullScalar(in_ty)), ResultWith(Datum(ArrayFromJSON(ty, "[]")))); + + this->AssertModesAre("[1, 2, 2, null]", ModeOptions(/*n=*/1), {2}, {2}); + this->AssertModesEmpty("[1, 2, 2, null]", ModeOptions(/*n=*/1, /*skip_nulls=*/false)); + this->AssertModesAre("[1, 2, 2, null]", + ModeOptions(/*n=*/1, /*skip_nulls=*/true, 
/*min_count=*/3), {2}, + {2}); + this->AssertModesEmpty("[2, 2, null]", + ModeOptions(/*n=*/1, /*skip_nulls=*/true, /*min_count=*/3)); + this->AssertModesAre( + "[1, 2, 2]", ModeOptions(/*n=*/1, /*skip_nulls=*/false, /*min_count=*/3), {2}, {2}); + this->AssertModesEmpty("[1, 2, 2, null]", + ModeOptions(/*n=*/1, /*skip_nulls=*/false, /*min_count=*/3)); + this->AssertModesEmpty("[1, 2]", + ModeOptions(/*n=*/1, /*skip_nulls=*/false, /*min_count=*/3)); + this->AssertModesAre(ScalarFromJSON(in_ty, "1"), + ModeOptions(/*n=*/1, /*skip_nulls=*/false), {1}, {1}); + this->AssertModesEmpty(ScalarFromJSON(in_ty, "null"), + ModeOptions(/*n=*/1, /*skip_nulls=*/false)); + this->AssertModesEmpty(ScalarFromJSON(in_ty, "1"), + ModeOptions(/*n=*/1, /*skip_nulls=*/true, /*min_count=*/2)); + this->AssertModesEmpty(ScalarFromJSON(in_ty, "null"), + ModeOptions(/*n=*/1, /*skip_nulls=*/true, /*min_count=*/2)); + this->AssertModesEmpty(ScalarFromJSON(in_ty, "1"), + ModeOptions(/*n=*/1, /*skip_nulls=*/false, /*min_count=*/2)); + this->AssertModesEmpty(ScalarFromJSON(in_ty, "null"), + ModeOptions(/*n=*/1, /*skip_nulls=*/false, /*min_count=*/2)); + + this->AssertModesAre(ScalarFromJSON(in_ty, "5"), ModeOptions(/*n=*/1), {5}, {1}); + this->AssertModesEmpty(ScalarFromJSON(in_ty, "null"), ModeOptions(/*n=*/1)); } TEST_F(TestInt8ModeKernelValueRange, Basics) { @@ -2672,6 +2762,36 @@ TYPED_TEST(TestIntegerQuantileKernel, Basics) { this->AssertQuantilesEmpty({"[null, null]", "[]", "[null]"}, {0.3, 0.4}); auto ty = this->type_singleton(); + + QuantileOptions keep_nulls(/*q=*/0.5, QuantileOptions::LINEAR, /*skip_nulls=*/false, + /*min_count=*/0); + QuantileOptions min_count(/*q=*/0.5, QuantileOptions::LINEAR, /*skip_nulls=*/true, + /*min_count=*/3); + QuantileOptions keep_nulls_min_count(/*q=*/0.5, QuantileOptions::LINEAR, + /*skip_nulls=*/false, /*min_count=*/3); + auto not_empty = ResultWith(ArrayFromJSON(float64(), "[3.0]")); + auto empty = ResultWith(ArrayFromJSON(float64(), "[]")); + EXPECT_THAT(Quantile(ArrayFromJSON(ty, "[1, 2, 4, 5]"), keep_nulls), not_empty); + EXPECT_THAT(Quantile(ArrayFromJSON(ty, "[1, 2, 4, 5, null]"), keep_nulls), empty); + EXPECT_THAT(Quantile(ArrayFromJSON(ty, "[1, 5]"), keep_nulls), not_empty); + EXPECT_THAT(Quantile(ArrayFromJSON(ty, "[1, 5, null]"), keep_nulls), empty); + EXPECT_THAT(Quantile(ScalarFromJSON(ty, "3"), keep_nulls), not_empty); + EXPECT_THAT(Quantile(ScalarFromJSON(ty, "null"), keep_nulls), empty); + EXPECT_THAT(Quantile(ArrayFromJSON(ty, "[1, 2, 4, 5]"), min_count), not_empty); + EXPECT_THAT(Quantile(ArrayFromJSON(ty, "[1, 2, 4, 5, null]"), min_count), not_empty); + EXPECT_THAT(Quantile(ArrayFromJSON(ty, "[1, 5]"), min_count), empty); + EXPECT_THAT(Quantile(ArrayFromJSON(ty, "[1, 5, null]"), min_count), empty); + EXPECT_THAT(Quantile(ScalarFromJSON(ty, "3"), min_count), empty); + EXPECT_THAT(Quantile(ScalarFromJSON(ty, "null"), min_count), empty); + EXPECT_THAT(Quantile(ArrayFromJSON(ty, "[1, 2, 4, 5]"), keep_nulls_min_count), + not_empty); + EXPECT_THAT(Quantile(ArrayFromJSON(ty, "[1, 2, 4, 5, null]"), keep_nulls_min_count), + empty); + EXPECT_THAT(Quantile(ArrayFromJSON(ty, "[1, 5]"), keep_nulls_min_count), empty); + EXPECT_THAT(Quantile(ArrayFromJSON(ty, "[1, 5, null]"), keep_nulls_min_count), empty); + EXPECT_THAT(Quantile(ScalarFromJSON(ty, "3"), keep_nulls_min_count), empty); + EXPECT_THAT(Quantile(ScalarFromJSON(ty, "null"), keep_nulls_min_count), empty); + for (const auto interpolation : this->interpolations_) { QuantileOptions options({0.0, 0.5, 1.0}, interpolation); 
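// Summary of the option matrix exercised above: with skip_nulls=false any null
// in the input empties the result; with min_count=3 fewer than three non-null
// values empties the result; when combined, either condition alone suffices.
// From the expectations above:
//   Quantile([1, 2, 4, 5, null], keep_nulls) -> []     (a null is present)
//   Quantile([1, 2, 4, 5, null], min_count)  -> [3.0]  (four non-nulls >= 3)
//   Quantile([1, 5], min_count)              -> []     (two non-nulls < 3)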
auto expected_ty = (interpolation == QuantileOptions::LINEAR || @@ -2718,6 +2838,36 @@ TYPED_TEST(TestFloatingQuantileKernel, Floats) { this->AssertQuantilesEmpty({"[NaN, NaN]", "[]", "[null]"}, {0.3, 0.4}); auto ty = this->type_singleton(); + + QuantileOptions keep_nulls(/*q=*/0.5, QuantileOptions::LINEAR, /*skip_nulls=*/false, + /*min_count=*/0); + QuantileOptions min_count(/*q=*/0.5, QuantileOptions::LINEAR, /*skip_nulls=*/true, + /*min_count=*/3); + QuantileOptions keep_nulls_min_count(/*q=*/0.5, QuantileOptions::LINEAR, + /*skip_nulls=*/false, /*min_count=*/3); + auto not_empty = ResultWith(ArrayFromJSON(float64(), "[3.0]")); + auto empty = ResultWith(ArrayFromJSON(float64(), "[]")); + EXPECT_THAT(Quantile(ArrayFromJSON(ty, "[1, 2, 4, 5]"), keep_nulls), not_empty); + EXPECT_THAT(Quantile(ArrayFromJSON(ty, "[1, 2, 4, 5, null]"), keep_nulls), empty); + EXPECT_THAT(Quantile(ArrayFromJSON(ty, "[1, 5]"), keep_nulls), not_empty); + EXPECT_THAT(Quantile(ArrayFromJSON(ty, "[1, 5, null]"), keep_nulls), empty); + EXPECT_THAT(Quantile(ScalarFromJSON(ty, "3"), keep_nulls), not_empty); + EXPECT_THAT(Quantile(ScalarFromJSON(ty, "null"), keep_nulls), empty); + EXPECT_THAT(Quantile(ArrayFromJSON(ty, "[1, 2, 4, 5]"), min_count), not_empty); + EXPECT_THAT(Quantile(ArrayFromJSON(ty, "[1, 2, 4, 5, null]"), min_count), not_empty); + EXPECT_THAT(Quantile(ArrayFromJSON(ty, "[1, 5]"), min_count), empty); + EXPECT_THAT(Quantile(ArrayFromJSON(ty, "[1, 5, null]"), min_count), empty); + EXPECT_THAT(Quantile(ScalarFromJSON(ty, "3"), min_count), empty); + EXPECT_THAT(Quantile(ScalarFromJSON(ty, "null"), min_count), empty); + EXPECT_THAT(Quantile(ArrayFromJSON(ty, "[1, 2, 4, 5]"), keep_nulls_min_count), + not_empty); + EXPECT_THAT(Quantile(ArrayFromJSON(ty, "[1, 2, 4, 5, null]"), keep_nulls_min_count), + empty); + EXPECT_THAT(Quantile(ArrayFromJSON(ty, "[1, 5]"), keep_nulls_min_count), empty); + EXPECT_THAT(Quantile(ArrayFromJSON(ty, "[1, 5, null]"), keep_nulls_min_count), empty); + EXPECT_THAT(Quantile(ScalarFromJSON(ty, "3"), keep_nulls_min_count), empty); + EXPECT_THAT(Quantile(ScalarFromJSON(ty, "null"), keep_nulls_min_count), empty); + for (const auto interpolation : this->interpolations_) { QuantileOptions options({0.0, 0.5, 1.0}, interpolation); auto expected_ty = (interpolation == QuantileOptions::LINEAR || @@ -3015,5 +3165,44 @@ TEST(TestTDigestKernel, Scalar) { } } +TEST(TestTDigestKernel, Options) { + auto ty = float64(); + TDigestOptions keep_nulls(/*q=*/0.5, /*delta=*/100, /*buffer_size=*/500, + /*skip_nulls=*/false, /*min_count=*/0); + TDigestOptions min_count(/*q=*/0.5, /*delta=*/100, /*buffer_size=*/500, + /*skip_nulls=*/true, /*min_count=*/3); + TDigestOptions keep_nulls_min_count(/*q=*/0.5, /*delta=*/100, /*buffer_size=*/500, + /*skip_nulls=*/false, /*min_count=*/3); + + EXPECT_THAT(TDigest(ArrayFromJSON(ty, "[1.0, 2.0, 3.0]"), keep_nulls), + ResultWith(ArrayFromJSON(ty, "[2.0]"))); + EXPECT_THAT(TDigest(ArrayFromJSON(ty, "[1.0, 2.0, 3.0, null]"), keep_nulls), + ResultWith(ArrayFromJSON(ty, "[]"))); + EXPECT_THAT(TDigest(ScalarFromJSON(ty, "1.0"), keep_nulls), + ResultWith(ArrayFromJSON(ty, "[1.0]"))); + EXPECT_THAT(TDigest(ScalarFromJSON(ty, "null"), keep_nulls), + ResultWith(ArrayFromJSON(ty, "[]"))); + + EXPECT_THAT(TDigest(ArrayFromJSON(ty, "[1.0, 2.0, 3.0, null]"), min_count), + ResultWith(ArrayFromJSON(ty, "[2.0]"))); + EXPECT_THAT(TDigest(ArrayFromJSON(ty, "[1.0, 2.0, null]"), min_count), + ResultWith(ArrayFromJSON(ty, "[]"))); + EXPECT_THAT(TDigest(ScalarFromJSON(ty, "1.0"), min_count), + 
ResultWith(ArrayFromJSON(ty, "[]"))); + EXPECT_THAT(TDigest(ScalarFromJSON(ty, "null"), min_count), + ResultWith(ArrayFromJSON(ty, "[]"))); + + EXPECT_THAT(TDigest(ArrayFromJSON(ty, "[1.0, 2.0, 3.0]"), keep_nulls_min_count), + ResultWith(ArrayFromJSON(ty, "[2.0]"))); + EXPECT_THAT(TDigest(ArrayFromJSON(ty, "[1.0, 2.0]"), keep_nulls_min_count), + ResultWith(ArrayFromJSON(ty, "[]"))); + EXPECT_THAT(TDigest(ArrayFromJSON(ty, "[1.0, 2.0, 3.0, null]"), keep_nulls_min_count), + ResultWith(ArrayFromJSON(ty, "[]"))); + EXPECT_THAT(TDigest(ScalarFromJSON(ty, "1.0"), keep_nulls_min_count), + ResultWith(ArrayFromJSON(ty, "[]"))); + EXPECT_THAT(TDigest(ScalarFromJSON(ty, "null"), keep_nulls_min_count), + ResultWith(ArrayFromJSON(ty, "[]"))); +} + } // namespace compute } // namespace arrow diff --git a/cpp/src/arrow/compute/kernels/codegen_internal.cc b/cpp/src/arrow/compute/kernels/codegen_internal.cc index f8b90085010..f230ca7ff73 100644 --- a/cpp/src/arrow/compute/kernels/codegen_internal.cc +++ b/cpp/src/arrow/compute/kernels/codegen_internal.cc @@ -17,6 +17,7 @@ #include "arrow/compute/kernels/codegen_internal.h" +#include #include #include #include @@ -145,12 +146,6 @@ const std::vector& DecimalTypeIds() { return g_decimal_type_ids; } -const std::vector& AllTimeUnits() { - static std::vector units = {TimeUnit::SECOND, TimeUnit::MILLI, - TimeUnit::MICRO, TimeUnit::NANO}; - return units; -} - const std::vector>& NumericTypes() { std::call_once(codegen_static_initialized, InitStaticData); return g_numeric_types; @@ -341,6 +336,91 @@ std::shared_ptr CommonBinary(const std::vector& descrs) { return large_binary(); } +Status CastBinaryDecimalArgs(DecimalPromotion promotion, + std::vector* descrs) { + auto& left_type = (*descrs)[0].type; + auto& right_type = (*descrs)[1].type; + DCHECK(is_decimal(left_type->id()) || is_decimal(right_type->id())); + + // decimal + float = float + if (is_floating(left_type->id())) { + right_type = left_type; + return Status::OK(); + } else if (is_floating(right_type->id())) { + left_type = right_type; + return Status::OK(); + } + + // precision, scale of left and right args + int32_t p1, s1, p2, s2; + + // decimal + integer = decimal + if (is_decimal(left_type->id())) { + auto decimal = checked_cast(left_type.get()); + p1 = decimal->precision(); + s1 = decimal->scale(); + } else { + DCHECK(is_integer(left_type->id())); + ARROW_ASSIGN_OR_RAISE(p1, MaxDecimalDigitsForInteger(left_type->id())); + s1 = 0; + } + if (is_decimal(right_type->id())) { + auto decimal = checked_cast(right_type.get()); + p2 = decimal->precision(); + s2 = decimal->scale(); + } else { + DCHECK(is_integer(right_type->id())); + ARROW_ASSIGN_OR_RAISE(p2, MaxDecimalDigitsForInteger(right_type->id())); + s2 = 0; + } + if (s1 < 0 || s2 < 0) { + return Status::NotImplemented("Decimals with negative scales not supported"); + } + + // decimal128 + decimal256 = decimal256 + Type::type casted_type_id = Type::DECIMAL128; + if (left_type->id() == Type::DECIMAL256 || right_type->id() == Type::DECIMAL256) { + casted_type_id = Type::DECIMAL256; + } + + // decimal promotion rules compatible with amazon redshift + // https://docs.aws.amazon.com/redshift/latest/dg/r_numeric_computations201.html + int32_t left_scaleup, right_scaleup; + + switch (promotion) { + case DecimalPromotion::kAdd: { + left_scaleup = std::max(s1, s2) - s1; + right_scaleup = std::max(s1, s2) - s2; + break; + } + case DecimalPromotion::kMultiply: { + left_scaleup = right_scaleup = 0; + break; + } + case DecimalPromotion::kDivide: { + left_scaleup = 
+      left_scaleup = std::max(4, s1 + p2 - s2 + 1) + s2 - s1;
+      right_scaleup = 0;
+      break;
+    }
+    default:
+      DCHECK(false) << "Invalid DecimalPromotion value " << static_cast<int>(promotion);
+  }
+
+  ARROW_ASSIGN_OR_RAISE(
+      left_type, DecimalType::Make(casted_type_id, p1 + left_scaleup, s1 + left_scaleup));
+  ARROW_ASSIGN_OR_RAISE(right_type, DecimalType::Make(casted_type_id, p2 + right_scaleup,
+                                                      s2 + right_scaleup));
+  return Status::OK();
+}
+
+bool HasDecimal(const std::vector<ValueDescr>& descrs) {
+  for (const auto& descr : descrs) {
+    if (is_decimal(descr.type->id())) {
+      return true;
+    }
+  }
+  return false;
+}
+
 }  // namespace internal
 }  // namespace compute
 }  // namespace arrow
diff --git a/cpp/src/arrow/compute/kernels/codegen_internal.h b/cpp/src/arrow/compute/kernels/codegen_internal.h
index 9c8b2cef198..98ca835a14c 100644
--- a/cpp/src/arrow/compute/kernels/codegen_internal.h
+++ b/cpp/src/arrow/compute/kernels/codegen_internal.h
@@ -94,8 +94,8 @@ struct OptionsWrapper : public KernelState {
 /// KernelContext and the FunctionOptions as argument
 template <typename StateType, typename OptionsType>
 struct KernelStateFromFunctionOptions : public KernelState {
-  explicit KernelStateFromFunctionOptions(KernelContext* ctx, OptionsType state)
-      : state(StateType(ctx, std::move(state))) {}
+  explicit KernelStateFromFunctionOptions(KernelContext* ctx, OptionsType options)
+      : state(StateType(ctx, std::move(options))) {}
 
   static Result<std::unique_ptr<KernelState>> Init(KernelContext* ctx,
                                                    const KernelInitArgs& args) {
@@ -415,9 +415,6 @@
 const std::vector<std::shared_ptr<DataType>>& IntTypes();
 const std::vector<std::shared_ptr<DataType>>& FloatingPointTypes();
 const std::vector<Type::type>& DecimalTypeIds();
 
-ARROW_EXPORT
-const std::vector<TimeUnit::type>& AllTimeUnits();
-
 // Returns a vector of example instances of parametric types such as
 //
 // * Decimal
@@ -1313,6 +1310,19 @@ std::shared_ptr<DataType> CommonTimestamp(const std::vector<ValueDescr>& descrs)
 ARROW_EXPORT
 std::shared_ptr<DataType> CommonBinary(const std::vector<ValueDescr>& descrs);
 
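The Redshift-compatible promotion rules above reduce to simple precision/scale
arithmetic, which can be sanity-checked in isolation. A minimal standalone sketch
of that arithmetic, assuming nothing from Arrow (PromotedPair, PromoteAdd, and
PromoteDivide are illustrative names, not Arrow APIs):

    #include <algorithm>
    #include <cstdint>
    #include <iostream>

    struct PromotedPair {
      int32_t p1, s1, p2, s2;  // promoted precision/scale of both operands
    };

    // kAdd: scale both operands up to max(s1, s2).
    PromotedPair PromoteAdd(int32_t p1, int32_t s1, int32_t p2, int32_t s2) {
      int32_t left_up = std::max(s1, s2) - s1;
      int32_t right_up = std::max(s1, s2) - s2;
      return {p1 + left_up, s1 + left_up, p2 + right_up, s2 + right_up};
    }

    // kDivide: scale the dividend up so the result keeps at least four
    // fractional digits (the Redshift rule cited above); divisor unchanged.
    PromotedPair PromoteDivide(int32_t p1, int32_t s1, int32_t p2, int32_t s2) {
      int32_t left_up = std::max(4, s1 + p2 - s2 + 1) + s2 - s1;
      return {p1 + left_up, s1 + left_up, p2, s2};
    }

    int main() {
      PromotedPair add = PromoteAdd(5, 2, 7, 4);     // decimal(5,2) + decimal(7,4)
      std::cout << add.p1 << "," << add.s1 << " and "
                << add.p2 << "," << add.s2 << "\n";  // 7,4 and 7,4
      PromotedPair div = PromoteDivide(5, 2, 7, 4);  // decimal(5,2) / decimal(7,4)
      std::cout << div.p1 << "," << div.s1 << " and "
                << div.p2 << "," << div.s2 << "\n";  // 13,10 and 7,4
    }

The actual output-type resolution (including decimal128-to-decimal256 widening)
still happens through DecimalType::Make, as in the function above.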
+/// How to promote decimal precision/scale in CastBinaryDecimalArgs.
+enum class DecimalPromotion : uint8_t {
+  kAdd,
+  kMultiply,
+  kDivide,
+};
+
+ARROW_EXPORT
+Status CastBinaryDecimalArgs(DecimalPromotion promotion, std::vector<ValueDescr>* descrs);
+
+ARROW_EXPORT
+bool HasDecimal(const std::vector<ValueDescr>& descrs);
+
 }  // namespace internal
 }  // namespace compute
 }  // namespace arrow
diff --git a/cpp/src/arrow/compute/kernels/hash_aggregate.cc b/cpp/src/arrow/compute/kernels/hash_aggregate.cc
index 3ea692857cf..23bb73f2a7f 100644
--- a/cpp/src/arrow/compute/kernels/hash_aggregate.cc
+++ b/cpp/src/arrow/compute/kernels/hash_aggregate.cc
@@ -1593,6 +1593,8 @@ struct GroupedTDigestImpl : public GroupedAggregator {
     options_ = *checked_cast<const TDigestOptions*>(options);
     ctx_ = ctx;
     pool_ = ctx->memory_pool();
+    counts_ = TypedBufferBuilder<int64_t>(pool_);
+    no_nulls_ = TypedBufferBuilder<bool>(pool_);
     return Status::OK();
   }
 
@@ -1602,12 +1604,21 @@ struct GroupedTDigestImpl : public GroupedAggregator {
     for (int64_t i = 0; i < added_groups; i++) {
       tdigests_.emplace_back(options_.delta, options_.buffer_size);
     }
+    RETURN_NOT_OK(counts_.Append(new_num_groups, 0));
+    RETURN_NOT_OK(no_nulls_.Append(new_num_groups, true));
     return Status::OK();
   }
 
   Status Consume(const ExecBatch& batch) override {
-    VisitGroupedValuesNonNull<Type>(
-        batch, [&](uint32_t g, CType value) { tdigests_[g].NanAdd(value); });
+    int64_t* counts = counts_.mutable_data();
+    uint8_t* no_nulls = no_nulls_.mutable_data();
+    VisitGroupedValues<Type>(
+        batch,
+        [&](uint32_t g, CType value) {
+          tdigests_[g].NanAdd(value);
+          counts[g]++;
+        },
+        [&](uint32_t g) { BitUtil::SetBitTo(no_nulls, g, false); });
     return Status::OK();
   }
 
@@ -1615,15 +1626,26 @@ struct GroupedTDigestImpl : public GroupedAggregator {
               const ArrayData& group_id_mapping) override {
     auto other = checked_cast<GroupedTDigestImpl*>(&raw_other);
 
+    int64_t* counts = counts_.mutable_data();
+    uint8_t* no_nulls = no_nulls_.mutable_data();
+
+    const int64_t* other_counts = other->counts_.data();
+    const uint8_t* other_no_nulls = other->no_nulls_.data();
+
     auto g = group_id_mapping.GetValues<uint32_t>(1);
     for (int64_t other_g = 0; other_g < group_id_mapping.length; ++other_g, ++g) {
       tdigests_[*g].Merge(other->tdigests_[other_g]);
+      counts[*g] += other_counts[other_g];
+      BitUtil::SetBitTo(
+          no_nulls, *g,
+          BitUtil::GetBit(no_nulls, *g) && BitUtil::GetBit(other_no_nulls, other_g));
     }
 
     return Status::OK();
   }
 
   Result<Datum> Finalize() override {
+    const int64_t* counts = counts_.data();
     std::shared_ptr<Buffer> null_bitmap;
     ARROW_ASSIGN_OR_RAISE(
         std::shared_ptr<Buffer> values,
@@ -1633,7 +1655,7 @@ struct GroupedTDigestImpl : public GroupedAggregator {
 
     double* results = reinterpret_cast<double*>(values->mutable_data());
     for (int64_t i = 0; static_cast<size_t>(i) < tdigests_.size(); ++i) {
-      if (!tdigests_[i].is_empty()) {
+      if (!tdigests_[i].is_empty() && counts[i] >= options_.min_count) {
        for (int64_t j = 0; j < slot_length; j++) {
          results[i * slot_length + j] = tdigests_[i].Quantile(options_.q[j]);
        }
@@ -1649,6 +1671,18 @@ struct GroupedTDigestImpl : public GroupedAggregator {
       std::fill(&results[i * slot_length], &results[(i + 1) * slot_length], 0.0);
     }
 
+    if (!options_.skip_nulls) {
+      null_count = kUnknownNullCount;
+      if (null_bitmap) {
+        arrow::internal::BitmapAnd(null_bitmap->data(), /*left_offset=*/0,
+                                   no_nulls_.data(), /*right_offset=*/0,
+                                   static_cast<int64_t>(tdigests_.size()),
+                                   /*out_offset=*/0, null_bitmap->mutable_data());
+      } else {
+        ARROW_ASSIGN_OR_RAISE(null_bitmap, no_nulls_.Finish());
+      }
+    }
+
     auto child = ArrayData::Make(float64(), tdigests_.size() * options_.q.size(),
                                  {nullptr, std::move(values)}, /*null_count=*/0);
     return ArrayData::Make(out_type(), tdigests_.size(), {std::move(null_bitmap)},
@@ -1661,6 +1695,8 @@ struct GroupedTDigestImpl : public GroupedAggregator {
 
   TDigestOptions options_;
   std::vector<TDigest> tdigests_;
+  TypedBufferBuilder<int64_t> counts_;
+  TypedBufferBuilder<bool> no_nulls_;
   ExecContext* ctx_;
   MemoryPool* pool_;
 };
diff --git a/cpp/src/arrow/compute/kernels/hash_aggregate_test.cc b/cpp/src/arrow/compute/kernels/hash_aggregate_test.cc
index 32e8efa0ab8..df13bd569ea 100644
--- a/cpp/src/arrow/compute/kernels/hash_aggregate_test.cc
+++ b/cpp/src/arrow/compute/kernels/hash_aggregate_test.cc
@@ -1086,27 +1086,40 @@ TEST(GroupBy, VarianceAndStddev) {
 TEST(GroupBy, TDigest) {
   auto batch = RecordBatchFromJSON(
       schema({field("argument", float64()), field("key", int64())}), R"([
-    [1, 1],
-    [null, 1],
-    [0, 2],
-    [null, 3],
-    [4, null],
-    [3, 1],
-    [0, 2],
-    [-1, 2],
-    [1, null],
-    [NaN, 3]
+    [1, 1],
+    [null, 1],
+    [0, 2],
+    [null, 3],
+    [1, 4],
+    [4, null],
+    [3, 1],
+    [0, 2],
+    [-1, 2],
+    [1, null],
+    [NaN, 3],
+    [1, 4],
+    [1, 4],
+    [null, 4]
 ])");
 
   TDigestOptions options1(std::vector<double>{0.5, 0.9, 0.99});
   TDigestOptions options2(std::vector<double>{0.5, 0.9, 0.99}, /*delta=*/50,
                           /*buffer_size=*/1024);
+  TDigestOptions keep_nulls(/*q=*/0.5, /*delta=*/100, /*buffer_size=*/500,
+                            /*skip_nulls=*/false, /*min_count=*/0);
+  TDigestOptions min_count(/*q=*/0.5, /*delta=*/100, /*buffer_size=*/500,
+                           /*skip_nulls=*/true, /*min_count=*/3);
+  TDigestOptions keep_nulls_min_count(/*q=*/0.5, /*delta=*/100, /*buffer_size=*/500,
+                                      /*skip_nulls=*/false, /*min_count=*/3);
   ASSERT_OK_AND_ASSIGN(Datum aggregated_and_grouped,
                        internal::GroupBy(
                            {
                                batch->GetColumnByName("argument"),
                                batch->GetColumnByName("argument"),
                                batch->GetColumnByName("argument"),
+                               batch->GetColumnByName("argument"),
+                               batch->GetColumnByName("argument"),
+                               batch->GetColumnByName("argument"),
                            },
                            {
                                batch->GetColumnByName("key"),
@@ -1115,6 +1128,9 @@ TEST(GroupBy, TDigest) {
                                {"hash_tdigest", nullptr},
                                {"hash_tdigest", &options1},
                                {"hash_tdigest", &options2},
+                               {"hash_tdigest", &keep_nulls},
+                               {"hash_tdigest", &min_count},
+                               {"hash_tdigest", &keep_nulls_min_count},
                            }));
 
   AssertDatumsApproxEqual(
@@ -1122,13 +1138,17 @@ TEST(GroupBy, TDigest) {
                         field("hash_tdigest", fixed_size_list(float64(), 1)),
                         field("hash_tdigest", fixed_size_list(float64(), 3)),
                         field("hash_tdigest", fixed_size_list(float64(), 3)),
+                        field("hash_tdigest", fixed_size_list(float64(), 1)),
+                        field("hash_tdigest", fixed_size_list(float64(), 1)),
+                        field("hash_tdigest", fixed_size_list(float64(), 1)),
                         field("key_0", int64()),
                     }),
                     R"([
-    [[1.0], [1.0, 3.0, 3.0], [1.0, 3.0, 3.0], 1],
-    [[0.0], [0.0, 0.0, 0.0], [0.0, 0.0, 0.0], 2],
-    [null, null, null, 3],
-    [[1.0], [1.0, 4.0, 4.0], [1.0, 4.0, 4.0], null]
+    [[1.0], [1.0, 3.0, 3.0], [1.0, 3.0, 3.0], null, null, null, 1],
+    [[0.0], [0.0, 0.0, 0.0], [0.0, 0.0, 0.0], [0.0], [0.0], [0.0], 2],
+    [null, null, null, null, null, null, 3],
+    [[1.0], [1.0, 1.0, 1.0], [1.0, 1.0, 1.0], null, [1.0], null, 4],
+    [[1.0], [1.0, 4.0, 4.0], [1.0, 4.0, 4.0], [1.0], null, null, null]
 ])"),
       aggregated_and_grouped,
       /*verbose=*/true);
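The expected values above follow from the per-group bookkeeping GroupedTDigestImpl
now carries: a count of non-null values gates min_count, and a "no nulls seen" flag
gates skip_nulls=false. A standalone sketch of that gating, independent of Arrow's
buffers (GroupState and EmitsResult are illustrative names, not Arrow code):

    #include <cstdint>
    #include <iostream>
    #include <optional>
    #include <vector>

    // Per-group state mirroring the counts_/no_nulls_ buffers added above.
    struct GroupState {
      int64_t count = 0;     // non-null values consumed for this group
      bool no_nulls = true;  // cleared once the group sees a null
    };

    // Mirrors the Finalize() gating: a group only emits a non-null result if it
    // has at least min_count values, and saw no nulls when skip_nulls is false.
    bool EmitsResult(const GroupState& g, bool skip_nulls, uint32_t min_count) {
      if (g.count < static_cast<int64_t>(min_count)) return false;
      if (!skip_nulls && !g.no_nulls) return false;
      return true;
    }

    int main() {
      GroupState g;
      std::vector<std::optional<double>> values = {1.0, 3.0, std::nullopt};
      for (const auto& v : values) {
        if (v.has_value()) g.count++; else g.no_nulls = false;
      }
      // Two values and one null, like key 1 in the test above:
      std::cout << EmitsResult(g, /*skip_nulls=*/true, /*min_count=*/3) << "\n";   // 0
      std::cout << EmitsResult(g, /*skip_nulls=*/false, /*min_count=*/0) << "\n";  // 0
      std::cout << EmitsResult(g, /*skip_nulls=*/true, /*min_count=*/2) << "\n";   // 1
    }

Key 1 (values 1, null, 3) is exactly this state: it survives the default options
but yields null under both keep_nulls and min_count, as the expected JSON shows.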
#include "arrow/compute/kernels/util_internal.h" #include "arrow/type.h" @@ -78,24 +80,27 @@ using enable_if_decimal_value = struct AbsoluteValue { template - static constexpr enable_if_floating_point Call(KernelContext*, T arg, Status*) { + static constexpr enable_if_floating_point Call(KernelContext*, Arg arg, + Status*) { return std::fabs(arg); } template - static constexpr enable_if_unsigned_c_integer Call(KernelContext*, T arg, Status*) { + static constexpr enable_if_unsigned_c_integer Call(KernelContext*, Arg arg, + Status*) { return arg; } template - static constexpr enable_if_signed_c_integer Call(KernelContext*, T arg, Status* st) { + static constexpr enable_if_signed_c_integer Call(KernelContext*, Arg arg, + Status* st) { return (arg < 0) ? arrow::internal::SafeSignedNegate(arg) : arg; } }; struct AbsoluteValueChecked { template - static enable_if_signed_c_integer Call(KernelContext*, Arg arg, Status* st) { + static enable_if_signed_c_integer Call(KernelContext*, Arg arg, Status* st) { static_assert(std::is_same::value, ""); if (arg == std::numeric_limits::min()) { *st = Status::Invalid("overflow"); @@ -105,13 +110,15 @@ struct AbsoluteValueChecked { } template - static enable_if_unsigned_c_integer Call(KernelContext* ctx, Arg arg, Status* st) { + static enable_if_unsigned_c_integer Call(KernelContext* ctx, Arg arg, + Status* st) { static_assert(std::is_same::value, ""); return arg; } template - static constexpr enable_if_floating_point Call(KernelContext*, Arg arg, Status* st) { + static constexpr enable_if_floating_point Call(KernelContext*, Arg arg, + Status* st) { static_assert(std::is_same::value, ""); return std::fabs(arg); } @@ -378,7 +385,7 @@ struct Negate { struct NegateChecked { template - static enable_if_signed_c_integer Call(KernelContext*, Arg arg, Status* st) { + static enable_if_signed_c_integer Call(KernelContext*, Arg arg, Status* st) { static_assert(std::is_same::value, ""); T result = 0; if (ARROW_PREDICT_FALSE(NegateWithOverflow(arg, &result))) { @@ -388,7 +395,8 @@ struct NegateChecked { } template - static enable_if_unsigned_c_integer Call(KernelContext* ctx, Arg arg, Status* st) { + static enable_if_unsigned_c_integer Call(KernelContext* ctx, Arg arg, + Status* st) { static_assert(std::is_same::value, ""); DCHECK(false) << "This is included only for the purposes of instantiability from the " "arithmetic kernel generator"; @@ -396,7 +404,8 @@ struct NegateChecked { } template - static constexpr enable_if_floating_point Call(KernelContext*, Arg arg, Status* st) { + static constexpr enable_if_floating_point Call(KernelContext*, Arg arg, + Status* st) { static_assert(std::is_same::value, ""); return -arg; } @@ -466,18 +475,20 @@ struct PowerChecked { struct Sign { template - static constexpr enable_if_floating_point Call(KernelContext*, Arg arg, Status*) { + static constexpr enable_if_floating_point Call(KernelContext*, Arg arg, + Status*) { return std::isnan(arg) ? arg : ((arg == 0) ? 0 : (std::signbit(arg) ? -1 : 1)); } template - static constexpr enable_if_unsigned_c_integer Call(KernelContext*, Arg arg, - Status*) { - return arg > 0; + static constexpr enable_if_unsigned_c_integer Call(KernelContext*, Arg arg, + Status*) { + return (arg > 0) ? 1 : 0; } template - static constexpr enable_if_signed_c_integer Call(KernelContext*, Arg arg, Status*) { + static constexpr enable_if_signed_c_integer Call(KernelContext*, Arg arg, + Status*) { return (arg > 0) ? 1 : ((arg == 0) ? 
@@ -852,24 +863,242 @@ struct LogbChecked {
   }
 };
 
+struct RoundUtil {
+  // Calculate powers of ten with arbitrary integer exponent
+  template <typename T>
+  static enable_if_floating_point<T> Pow10(int64_t power) {
+    static constexpr T lut[] = {1e0F, 1e1F, 1e2F,  1e3F,  1e4F,  1e5F,  1e6F,  1e7F,
+                                1e8F, 1e9F, 1e10F, 1e11F, 1e12F, 1e13F, 1e14F, 1e15F};
+    int64_t lut_size = (sizeof(lut) / sizeof(*lut));
+    int64_t abs_power = std::abs(power);
+    auto pow10 = lut[std::min(abs_power, lut_size - 1)];
+    while (abs_power-- >= lut_size) {
+      pow10 *= 1e1F;
+    }
+    return (power >= 0) ? pow10 : (1 / pow10);
+  }
+};
+
+// Specializations of rounding implementations for round kernels
+template <typename T, RoundMode>
+struct RoundImpl;
+
+template <typename T>
+struct RoundImpl<T, RoundMode::DOWN> {
+  static constexpr enable_if_floating_point<T> Round(const T val) {
+    return std::floor(val);
+  }
+};
+
+template <typename T>
+struct RoundImpl<T, RoundMode::UP> {
+  static constexpr enable_if_floating_point<T> Round(const T val) {
+    return std::ceil(val);
+  }
+};
+
+template <typename T>
+struct RoundImpl<T, RoundMode::TOWARDS_ZERO> {
+  static constexpr enable_if_floating_point<T> Round(const T val) {
+    return std::trunc(val);
+  }
+};
+
+template <typename T>
+struct RoundImpl<T, RoundMode::TOWARDS_INFINITY> {
+  static constexpr enable_if_floating_point<T> Round(const T val) {
+    return std::signbit(val) ? std::floor(val) : std::ceil(val);
+  }
+};
+
+// NOTE: RoundImpl variants for the HALF_* rounding modes are only
+// invoked when the fractional part is equal to 0.5 (std::round is invoked
+// otherwise).
+
+template <typename T>
+struct RoundImpl<T, RoundMode::HALF_DOWN> {
+  static constexpr enable_if_floating_point<T> Round(const T val) {
+    return RoundImpl<T, RoundMode::DOWN>::Round(val);
+  }
+};
+
+template <typename T>
+struct RoundImpl<T, RoundMode::HALF_UP> {
+  static constexpr enable_if_floating_point<T> Round(const T val) {
+    return RoundImpl<T, RoundMode::UP>::Round(val);
+  }
+};
+
+template <typename T>
+struct RoundImpl<T, RoundMode::HALF_TOWARDS_ZERO> {
+  static constexpr enable_if_floating_point<T> Round(const T val) {
+    return RoundImpl<T, RoundMode::TOWARDS_ZERO>::Round(val);
+  }
+};
+
+template <typename T>
+struct RoundImpl<T, RoundMode::HALF_TOWARDS_INFINITY> {
+  static constexpr enable_if_floating_point<T> Round(const T val) {
+    return RoundImpl<T, RoundMode::TOWARDS_INFINITY>::Round(val);
+  }
+};
+
+template <typename T>
+struct RoundImpl<T, RoundMode::HALF_TO_EVEN> {
+  static constexpr enable_if_floating_point<T> Round(const T val) {
+    return std::round(val * T(0.5)) * 2;
+  }
+};
+
+template <typename T>
+struct RoundImpl<T, RoundMode::HALF_TO_ODD> {
+  static constexpr enable_if_floating_point<T> Round(const T val) {
+    return std::floor(val * T(0.5)) + std::ceil(val * T(0.5));
+  }
+};
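Those HALF_* bodies only ever see exact .5 ties (the Round kernels below fall
back to std::round otherwise), so their behavior is easiest to observe on tie
values. A standalone sketch using plain <cmath>, with free functions named after
the modes (illustrative names, not Arrow code):

    #include <cmath>
    #include <cstdio>

    // Tie-breaking on x.5 values, mirroring the RoundImpl bodies above.
    double HalfToEven(double v) { return std::round(v * 0.5) * 2; }
    double HalfToOdd(double v) { return std::floor(v * 0.5) + std::ceil(v * 0.5); }
    double HalfTowardsInfinity(double v) {
      return std::signbit(v) ? std::floor(v) : std::ceil(v);
    }

    int main() {
      for (double v : {-2.5, -1.5, -0.5, 0.5, 1.5, 2.5}) {
        std::printf("%5.1f  even=%5.1f  odd=%5.1f  inf=%5.1f\n", v, HalfToEven(v),
                    HalfToOdd(v), HalfTowardsInfinity(v));
      }
    }

HALF_TO_EVEN matches IEEE 754 round-half-to-even ("banker's rounding"): both
-2.5 and -1.5 land on -2, while HALF_TO_ODD sends them to -3 and -1.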
+
+// Specializations of kernel state for round kernels
+template <typename OptionsType>
+struct RoundOptionsWrapper;
+
+template <>
+struct RoundOptionsWrapper<RoundOptions> : public OptionsWrapper<RoundOptions> {
+  using OptionsType = RoundOptions;
+  using State = RoundOptionsWrapper<OptionsType>;
+  double pow10;
+
+  explicit RoundOptionsWrapper(OptionsType options) : OptionsWrapper(std::move(options)) {
+    // Only positive exponents for powers of 10 are used because combining
+    // multiply and division operations produced more stable rounding than
+    // using multiply-only.  Refer to NumPy's round implementation:
+    // https://github.com/numpy/numpy/blob/7b2f20b406d27364c812f7a81a9c901afbd3600c/numpy/core/src/multiarray/calculation.c#L589
+    pow10 = RoundUtil::Pow10<double>(std::abs(options.ndigits));
+  }
+
+  static Result<std::unique_ptr<KernelState>> Init(KernelContext* ctx,
+                                                   const KernelInitArgs& args) {
+    if (auto options = static_cast<const OptionsType*>(args.options)) {
+      return ::arrow::internal::make_unique<State>(*options);
+    }
+    return Status::Invalid(
+        "Attempted to initialize KernelState from null FunctionOptions");
+  }
+};
+
+template <>
+struct RoundOptionsWrapper<RoundToMultipleOptions>
+    : public OptionsWrapper<RoundToMultipleOptions> {
+  using OptionsType = RoundToMultipleOptions;
+
+  static Result<std::unique_ptr<KernelState>> Init(KernelContext* ctx,
+                                                   const KernelInitArgs& args) {
+    ARROW_ASSIGN_OR_RAISE(auto state, OptionsWrapper::Init(ctx, args));
+    auto options = Get(*state);
+    if (options.multiple <= 0) {
+      return Status::Invalid("Rounding multiple has to be a positive value");
+    }
+    return std::move(state);
+  }
+};
+
+template <RoundMode RndMode>
+struct Round {
+  using State = RoundOptionsWrapper<RoundOptions>;
+
+  template <typename T, typename Arg>
+  static enable_if_floating_point<T> Call(KernelContext* ctx, Arg arg, Status* st) {
+    static_assert(std::is_same<T, Arg>::value, "");
+    // Do not process Inf or NaN because they will trigger the overflow error at end of
+    // function.
+    if (!std::isfinite(arg)) {
+      return arg;
+    }
+    auto state = static_cast<const State*>(ctx->state());
+    auto options = state->options;
+    auto pow10 = T(state->pow10);
+    auto round_val = (options.ndigits >= 0) ? (arg * pow10) : (arg / pow10);
+    auto frac = round_val - std::floor(round_val);
+    if (frac != T(0)) {
+      // Use std::round() if in tie-breaking mode and scaled value is not 0.5.
+      if ((RndMode >= RoundMode::HALF_DOWN) && (frac != T(0.5))) {
+        round_val = std::round(round_val);
+      } else {
+        round_val = RoundImpl<T, RndMode>::Round(round_val);
+      }
+      // Equality check is omitted so that the common case of 10^0 (integer rounding)
+      // uses multiply-only
+      round_val = (options.ndigits > 0) ? (round_val / pow10) : (round_val * pow10);
+      if (!std::isfinite(round_val)) {
+        *st = Status::Invalid("overflow occurred during rounding");
+        return arg;
+      }
+    } else {
+      // If scaled value is an integer, then no rounding is needed.
+      round_val = arg;
+    }
+    return round_val;
+  }
+};
+
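A standalone sketch of the scale/round/unscale flow in Round::Call above,
including the exact-tie test that routes to RoundImpl; the HALF_DOWN stand-in
and the sample value are illustrative only:

    #include <cmath>
    #include <cstdio>

    int main() {
      // Round 0.125 to 2 digits with a HALF_DOWN-style tie-break, mirroring
      // Round::Call: scale up by 10^ndigits, round, then divide back down.
      double arg = 0.125, pow10 = 1e2;            // ndigits = 2
      double scaled = arg * pow10;                // 12.5, exactly representable
      double frac = scaled - std::floor(scaled);  // 0.5: an exact tie
      double rounded = (frac == 0.5) ? std::floor(scaled)   // tie: RoundImpl path
                                     : std::round(scaled);  // otherwise std::round
      std::printf("%g -> %g\n", arg, rounded / pow10);      // prints: 0.125 -> 0.12
    }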
+template <RoundMode RndMode>
+struct RoundToMultiple {
+  using State = RoundOptionsWrapper<RoundToMultipleOptions>;
+
+  template <typename T, typename Arg>
+  static enable_if_floating_point<T> Call(KernelContext* ctx, Arg arg, Status* st) {
+    static_assert(std::is_same<T, Arg>::value, "");
+    // Do not process Inf or NaN because they will trigger the overflow error at end of
+    // function.
+    if (!std::isfinite(arg)) {
+      return arg;
+    }
+    auto options = State::Get(ctx);
+    auto round_val = arg / T(options.multiple);
+    auto frac = round_val - std::floor(round_val);
+    if (frac != T(0)) {
+      // Use std::round() if in tie-breaking mode and scaled value is not 0.5.
+      if ((RndMode >= RoundMode::HALF_DOWN) && (frac != T(0.5))) {
+        round_val = std::round(round_val);
+      } else {
+        round_val = RoundImpl<T, RndMode>::Round(round_val);
+      }
+      round_val *= T(options.multiple);
+      if (!std::isfinite(round_val)) {
+        *st = Status::Invalid("overflow occurred during rounding");
+        return arg;
+      }
+    } else {
+      // If scaled value is an integer, then no rounding is needed.
+      round_val = arg;
+    }
+    return round_val;
+  }
+};
+
 struct Floor {
   template <typename T, typename Arg>
-  static constexpr enable_if_floating_point<T> Call(KernelContext*, Arg arg, Status*) {
-    return std::floor(arg);
+  static constexpr enable_if_floating_point<Arg, T> Call(KernelContext*, Arg arg,
+                                                         Status*) {
+    static_assert(std::is_same<T, Arg>::value, "");
+    return RoundImpl<T, RoundMode::DOWN>::Round(arg);
   }
 };
 
 struct Ceil {
   template <typename T, typename Arg>
-  static constexpr enable_if_floating_point<T> Call(KernelContext*, Arg arg, Status*) {
-    return std::ceil(arg);
+  static constexpr enable_if_floating_point<Arg, T> Call(KernelContext*, Arg arg,
+                                                         Status*) {
+    static_assert(std::is_same<T, Arg>::value, "");
+    return RoundImpl<T, RoundMode::UP>::Round(arg);
   }
 };
 
 struct Trunc {
   template <typename T, typename Arg>
-  static constexpr enable_if_floating_point<T> Call(KernelContext*, Arg arg, Status*) {
-    return std::trunc(arg);
+  static constexpr enable_if_floating_point<Arg, T> Call(KernelContext*, Arg arg,
+                                                         Status*) {
+    static_assert(std::is_same<T, Arg>::value, "");
+    return RoundImpl<T, RoundMode::TOWARDS_ZERO>::Round(arg);
   }
 };
 
@@ -965,78 +1194,6 @@ ArrayKernelExec GenerateArithmeticFloatingPoint(detail::GetTypeId get_id) {
   }
 }
 
-Status CastBinaryDecimalArgs(const std::string& func_name,
-                             std::vector<ValueDescr>* values) {
-  auto& left_type = (*values)[0].type;
-  auto& right_type = (*values)[1].type;
-  DCHECK(is_decimal(left_type->id()) || is_decimal(right_type->id()));
-
-  // decimal + float = float
-  if (is_floating(left_type->id())) {
-    right_type = left_type;
-    return Status::OK();
-  } else if (is_floating(right_type->id())) {
-    left_type = right_type;
-    return Status::OK();
-  }
-
-  // precision, scale of left and right args
-  int32_t p1, s1, p2, s2;
-
-  // decimal + integer = decimal
-  if (is_decimal(left_type->id())) {
-    auto decimal = checked_cast<const DecimalType*>(left_type.get());
-    p1 = decimal->precision();
-    s1 = decimal->scale();
-  } else {
-    DCHECK(is_integer(left_type->id()));
-    p1 = static_cast<int32_t>(std::ceil(std::log10(bit_width(left_type->id()))));
-    s1 = 0;
-  }
-  if (is_decimal(right_type->id())) {
-    auto decimal = checked_cast<const DecimalType*>(right_type.get());
-    p2 = decimal->precision();
-    s2 = decimal->scale();
-  } else {
-    DCHECK(is_integer(right_type->id()));
-    p2 = static_cast<int32_t>(std::ceil(std::log10(bit_width(right_type->id()))));
-    s2 = 0;
-  }
-  if (s1 < 0 || s2 < 0) {
-    return Status::NotImplemented("Decimals with negative scales not supported");
-  }
-
-  // decimal128 + decimal256 = decimal256
-  Type::type casted_type_id = Type::DECIMAL128;
-  if (left_type->id() == Type::DECIMAL256 || right_type->id() == Type::DECIMAL256) {
-    casted_type_id = Type::DECIMAL256;
-  }
-
-  // decimal promotion rules compatible with amazon redshift
-  // https://docs.aws.amazon.com/redshift/latest/dg/r_numeric_computations201.html
-  int32_t left_scaleup, right_scaleup;
-
-  // "add_checked" -> "add"
-  const std::string op = func_name.substr(0, func_name.find("_"));
-  if (op == "add" || op == "subtract") {
-    left_scaleup = std::max(s1, s2) - s1;
-    right_scaleup = std::max(s1, s2) - s2;
-  } else if (op == "multiply") {
-    left_scaleup = right_scaleup = 0;
-  } else if (op == "divide") {
-    left_scaleup = std::max(4, s1 + p2 - s2 + 1) + s2 - s1;
-    right_scaleup = 0;
-  } else {
-    return Status::Invalid("Invalid decimal function: ", func_name);
-  }
-
-  ARROW_ASSIGN_OR_RAISE(
-      left_type, DecimalType::Make(casted_type_id, p1 + left_scaleup, s1 + left_scaleup));
-  ARROW_ASSIGN_OR_RAISE(right_type, DecimalType::Make(casted_type_id, p2 + right_scaleup,
-                                                      s2 + right_scaleup));
-  return Status::OK();
-}
-
 // resolve decimal binary operation output type per *casted* args
 template <typename Op>
 Result<ValueDescr> ResolveDecimalBinaryOperationOutput(
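Worth noting about the block removed above: it derived an integer operand's
precision from ceil(log10(bit_width)), which yields 2 digits for int32 rather
than the 10 it needs; the replacement in codegen_internal.cc calls
MaxDecimalDigitsForInteger instead. A quick standalone check of the correct
digit counts, assuming two's-complement ranges (DigitsForSignedBits is an
illustrative helper, not the Arrow function):

    #include <cmath>
    #include <cstdint>
    #include <cstdio>

    // Digits needed to represent any value of an N-bit signed integer:
    // ceil(log10(2^(N-1))), i.e. the digit count of |minimum value|.
    static int32_t DigitsForSignedBits(int bits) {
      return static_cast<int32_t>(std::ceil((bits - 1) * std::log10(2.0)));
    }

    int main() {
      for (int bits : {8, 16, 32, 64}) {
        std::printf("int%-2d needs %2d digits; ceil(log10(bit_width)) gave %d\n",
                    bits, DigitsForSignedBits(bits),
                    static_cast<int>(std::ceil(std::log10(bits))));
      }
    }

This prints 3, 5, 10, and 19 digits for int8 through int64, against 1 or 2 from
the removed formula.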
@@ -1166,17 +1323,21 @@ struct ArithmeticFunction : ScalarFunction {
   }
 
   Status CheckDecimals(std::vector<ValueDescr>* values) const {
-    bool has_decimal = false;
-    for (const auto& value : *values) {
-      if (is_decimal(value.type->id())) {
-        has_decimal = true;
-        break;
-      }
-    }
-    if (!has_decimal) return Status::OK();
+    if (!HasDecimal(*values)) return Status::OK();
 
     if (values->size() == 2) {
-      return CastBinaryDecimalArgs(name(), values);
+      // "add_checked" -> "add"
+      const auto func_name = name();
+      const std::string op = func_name.substr(0, func_name.find("_"));
+      if (op == "add" || op == "subtract") {
+        return CastBinaryDecimalArgs(DecimalPromotion::kAdd, values);
+      } else if (op == "multiply") {
+        return CastBinaryDecimalArgs(DecimalPromotion::kMultiply, values);
+      } else if (op == "divide") {
+        return CastBinaryDecimalArgs(DecimalPromotion::kDivide, values);
+      } else {
+        return Status::Invalid("Invalid decimal function: ", func_name);
+      }
     }
     return Status::OK();
   }
@@ -1276,6 +1437,65 @@ std::shared_ptr<ScalarFunction> MakeUnaryArithmeticFunctionNotNull(
   return func;
 }
 
+// Generate a kernel given an arithmetic rounding functor
+template