From 053f7da21c47f7caf739c999bbb424356ee18cd7 Mon Sep 17 00:00:00 2001 From: Muhammad Haseeb Date: Tue, 30 Apr 2024 02:53:43 +0000 Subject: [PATCH 01/53] Read duration type in cudf parquet via arrow:schema --- .../cudf/detail/utilities/base64_utils.hpp | 159 + cpp/include/cudf/io/ipc/Message.fbs | 155 + cpp/include/cudf/io/ipc/Schema.fbs | 570 ++++ .../cudf/io/ipc/detail/Message_generated.h | 651 ++++ .../cudf/io/ipc/detail/Schema_generated.h | 2769 +++++++++++++++++ .../cudf/io/ipc/flatbuffers/allocator.h | 73 + cpp/include/cudf/io/ipc/flatbuffers/array.h | 267 ++ cpp/include/cudf/io/ipc/flatbuffers/base.h | 498 +++ cpp/include/cudf/io/ipc/flatbuffers/buffer.h | 222 ++ .../cudf/io/ipc/flatbuffers/buffer_ref.h | 58 + .../io/ipc/flatbuffers/default_allocator.h | 70 + .../cudf/io/ipc/flatbuffers/detached_buffer.h | 128 + .../io/ipc/flatbuffers/flatbuffer_builder.h | 1574 ++++++++++ .../cudf/io/ipc/flatbuffers/flatbuffers.h | 289 ++ .../cudf/io/ipc/flatbuffers/stl_emulation.h | 568 ++++ cpp/include/cudf/io/ipc/flatbuffers/string.h | 70 + cpp/include/cudf/io/ipc/flatbuffers/struct.h | 60 + cpp/include/cudf/io/ipc/flatbuffers/table.h | 202 ++ cpp/include/cudf/io/ipc/flatbuffers/vector.h | 416 +++ .../cudf/io/ipc/flatbuffers/vector_downward.h | 316 ++ .../cudf/io/ipc/flatbuffers/verifier.h | 389 +++ cpp/src/io/functions.cpp | 3 + cpp/src/io/parquet/reader_impl.cpp | 42 +- cpp/src/io/parquet/reader_impl_helpers.cpp | 628 ++-- cpp/src/io/parquet/reader_impl_helpers.hpp | 22 +- 25 files changed, 9993 insertions(+), 206 deletions(-) create mode 100644 cpp/include/cudf/detail/utilities/base64_utils.hpp create mode 100644 cpp/include/cudf/io/ipc/Message.fbs create mode 100644 cpp/include/cudf/io/ipc/Schema.fbs create mode 100644 cpp/include/cudf/io/ipc/detail/Message_generated.h create mode 100644 cpp/include/cudf/io/ipc/detail/Schema_generated.h create mode 100644 cpp/include/cudf/io/ipc/flatbuffers/allocator.h create mode 100644 cpp/include/cudf/io/ipc/flatbuffers/array.h create mode 100644 cpp/include/cudf/io/ipc/flatbuffers/base.h create mode 100644 cpp/include/cudf/io/ipc/flatbuffers/buffer.h create mode 100644 cpp/include/cudf/io/ipc/flatbuffers/buffer_ref.h create mode 100644 cpp/include/cudf/io/ipc/flatbuffers/default_allocator.h create mode 100644 cpp/include/cudf/io/ipc/flatbuffers/detached_buffer.h create mode 100644 cpp/include/cudf/io/ipc/flatbuffers/flatbuffer_builder.h create mode 100644 cpp/include/cudf/io/ipc/flatbuffers/flatbuffers.h create mode 100644 cpp/include/cudf/io/ipc/flatbuffers/stl_emulation.h create mode 100644 cpp/include/cudf/io/ipc/flatbuffers/string.h create mode 100644 cpp/include/cudf/io/ipc/flatbuffers/struct.h create mode 100644 cpp/include/cudf/io/ipc/flatbuffers/table.h create mode 100644 cpp/include/cudf/io/ipc/flatbuffers/vector.h create mode 100644 cpp/include/cudf/io/ipc/flatbuffers/vector_downward.h create mode 100644 cpp/include/cudf/io/ipc/flatbuffers/verifier.h diff --git a/cpp/include/cudf/detail/utilities/base64_utils.hpp b/cpp/include/cudf/detail/utilities/base64_utils.hpp new file mode 100644 index 00000000000..fd8e85ec382 --- /dev/null +++ b/cpp/include/cudf/detail/utilities/base64_utils.hpp @@ -0,0 +1,159 @@ +/* + base64_utils.cpp and base64_utils.hpp + + base64 encoding and decoding with C++. + + Version: 1.01.00 + + Copyright (C) 2004-2017 René Nyffenegger + + This source code is provided 'as-is', without any express or implied + warranty. In no event will the author be held liable for any damages + arising from the use of this software. 
+ + Permission is granted to anyone to use this software for any purpose, + including commercial applications, and to alter it and redistribute it + freely, subject to the following restrictions: + + 1. The origin of this source code must not be misrepresented; you must not + claim that you wrote the original source code. If you use this source code + in a product, an acknowledgment in the product documentation would be + appreciated but is not required. + + 2. Altered source versions must be plainly marked as such, and must not be + misrepresented as being the original source code. + + 3. This notice may not be removed or altered from any source distribution. + + René Nyffenegger rene.nyffenegger@adp-gmbh.ch + +*/ + +/** + * @file base64_utils.hpp + * @brief base64 string encoding/decoding utilities and implementation + */ + +#pragma once + +// altered: including required std headers +#include +#include +#include +#include + +// altered: merged base64.h and base64.cpp into one file. +// altered: applying clang-format for libcudf on this file. + +// altered: use cudf namespaces +namespace cudf::detail { + +static const std::string base64_chars = + "ABCDEFGHIJKLMNOPQRSTUVWXYZ" + "abcdefghijklmnopqrstuvwxyz" + "0123456789+/"; + +static inline auto is_base64(unsigned char c) { return (isalnum(c) or (c == '+') or (c == '/')); } + +// merging the encoder wrapper into the single function +std::string base64_encode(std::string_view string_to_encode) +{ + // get bytes to encode and length + auto bytes_to_encode = reinterpret_cast(string_to_encode.data()); + auto input_length = string_to_encode.size(); + + std::string encoded; + std::array char_array_4; + std::array char_array_3; + int i = 0; + int j = 0; + + // altered: added braces to one liner loops in the rest of this function + while (input_length--) { + char_array_3[i++] = *(bytes_to_encode++); + if (i == 3) { + char_array_4[0] = (char_array_3[0] & 0xfc) >> 2; + char_array_4[1] = ((char_array_3[0] & 0x03) << 4) + ((char_array_3[1] & 0xf0) >> 4); + char_array_4[2] = ((char_array_3[1] & 0x0f) << 2) + ((char_array_3[2] & 0xc0) >> 6); + char_array_4[3] = char_array_3[2] & 0x3f; + + for (i = 0; (i < 4); i++) { + encoded += base64_chars[char_array_4[i]]; + } + i = 0; + } + } + + if (i) { + for (j = i; j < 3; j++) { + char_array_3[j] = '\0'; + } + + char_array_4[0] = (char_array_3[0] & 0xfc) >> 2; + char_array_4[1] = ((char_array_3[0] & 0x03) << 4) + ((char_array_3[1] & 0xf0) >> 4); + char_array_4[2] = ((char_array_3[1] & 0x0f) << 2) + ((char_array_3[2] & 0xc0) >> 6); + + for (j = 0; (j < i + 1); j++) { + encoded += base64_chars[char_array_4[j]]; + } + while ((i++ < 3)) { + encoded += '='; + } + } + + return encoded; +} + +// base64 decode lambda function +std::string base64_decode(std::string_view encoded_string) +{ + std::array char_array_4; + std::array char_array_3; + std::string decoded; + size_t input_len = encoded_string.size(); + + int i = 0; + int j = 0; + int in_ = 0; + + // altered: added braces to one liner loops in the rest of this function + while (input_len-- and (encoded_string[in_] != '=') and is_base64(encoded_string[in_])) { + char_array_4[i++] = encoded_string[in_]; + in_++; + if (i == 4) { + for (i = 0; i < 4; i++) { + char_array_4[i] = base64_chars.find(char_array_4[i]) & 0xff; + } + + char_array_3[0] = (char_array_4[0] << 2) + ((char_array_4[1] & 0x30) >> 4); + char_array_3[1] = ((char_array_4[1] & 0xf) << 4) + ((char_array_4[2] & 0x3c) >> 2); + char_array_3[2] = ((char_array_4[2] & 0x3) << 6) + char_array_4[3]; + + for (i = 
0; (i < 3); i++) { + decoded += char_array_3[i]; + } + i = 0; + } + } + + // altered: modify to i!=0 for better readability + if (i != 0) { + for (j = 0; j < i; j++) { + char_array_4[j] = base64_chars.find(char_array_4[j]) & 0xff; + } + char_array_3[0] = (char_array_4[0] << 2) + ((char_array_4[1] & 0x30) >> 4); + char_array_3[1] = ((char_array_4[1] & 0xf) << 4) + ((char_array_4[2] & 0x3c) >> 2); + // altered: TODO: arrow source code doesn't have the below line. + // altered: This is inconsequential as it is never appended to + // altered: `decoded` as max(i) = 3 and 0 <= j < 2. + char_array_3[2] = ((char_array_4[2] & 0x3) << 6) + char_array_4[3]; + + for (j = 0; j < i - 1; j++) { + decoded += char_array_3[j]; + } + } + + return decoded; +} + +} // namespace cudf::detail diff --git a/cpp/include/cudf/io/ipc/Message.fbs b/cpp/include/cudf/io/ipc/Message.fbs new file mode 100644 index 00000000000..8a65c2e3cf9 --- /dev/null +++ b/cpp/include/cudf/io/ipc/Message.fbs @@ -0,0 +1,155 @@ +// Licensed to the Apache Software Foundation (ASF) under one +// or more contributor license agreements. See the NOTICE file +// distributed with this work for additional information +// regarding copyright ownership. The ASF licenses this file +// to you under the Apache License, Version 2.0 (the +// "License"); you may not use this file except in compliance +// with the License. You may obtain a copy of the License at +// +// http://www.apache.org/licenses/LICENSE-2.0 +// +// Unless required by applicable law or agreed to in writing, +// software distributed under the License is distributed on an +// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +// KIND, either express or implied. See the License for the +// specific language governing permissions and limitations +// under the License. + +include "Schema.fbs"; + +namespace cudf.io.parquet.flatbuf; + +/// ---------------------------------------------------------------------- +/// Data structures for describing a table row batch (a collection of +/// equal-length Arrow arrays) + +/// Metadata about a field at some level of a nested type tree (but not +/// its children). +/// +/// For example, a List with values `[[1, 2, 3], null, [4], [5, 6], null]` +/// would have {length: 5, null_count: 2} for its List node, and {length: 6, +/// null_count: 0} for its Int16 node, as separate FieldNode structs +struct FieldNode { + /// The number of value slots in the Arrow array at this level of a nested + /// tree + length: long; + + /// The number of observed nulls. Fields with null_count == 0 may choose not + /// to write their physical validity bitmap out as a materialized buffer, + /// instead setting the length of the bitmap buffer to 0. + null_count: long; +} + +enum CompressionType:byte { + // LZ4 frame format, for portability, as provided by lz4frame.h or wrappers + // thereof. Not to be confused with "raw" (also called "block") format + // provided by lz4.h + LZ4_FRAME, + + // Zstandard + ZSTD +} + +/// Provided for forward compatibility in case we need to support different +/// strategies for compressing the IPC message body (like whole-body +/// compression rather than buffer-level) in the future +enum BodyCompressionMethod:byte { + /// Each constituent buffer is first compressed with the indicated + /// compressor, and then written with the uncompressed length in the first 8 + /// bytes as a 64-bit little-endian signed integer followed by the compressed + /// buffer bytes (and then padding as required by the protocol). 
The + /// uncompressed length may be set to -1 to indicate that the data that + /// follows is not compressed, which can be useful for cases where + /// compression does not yield appreciable savings. + BUFFER +} + +/// Optional compression for the memory buffers constituting IPC message +/// bodies. Intended for use with RecordBatch but could be used for other +/// message types +table BodyCompression { + /// Compressor library. + /// For LZ4_FRAME, each compressed buffer must consist of a single frame. + codec: CompressionType = LZ4_FRAME; + + /// Indicates the way the record batch body was compressed + method: BodyCompressionMethod = BUFFER; +} + +/// A data header describing the shared memory layout of a "record" or "row" +/// batch. Some systems call this a "row batch" internally and others a "record +/// batch". +table RecordBatch { + /// number of records / rows. The arrays in the batch should all have this + /// length + length: long; + + /// Nodes correspond to the pre-ordered flattened logical schema + nodes: [FieldNode]; + + /// Buffers correspond to the pre-ordered flattened buffer tree + /// + /// The number of buffers appended to this list depends on the schema. For + /// example, most primitive arrays will have 2 buffers, 1 for the validity + /// bitmap and 1 for the values. For struct arrays, there will only be a + /// single buffer for the validity (nulls) bitmap + buffers: [Buffer]; + + /// Optional compression of the message body + compression: BodyCompression; + + /// Some types such as Utf8View are represented using a variable number of buffers. + /// For each such Field in the pre-ordered flattened logical schema, there will be + /// an entry in variadicBufferCounts to indicate the number of number of variadic + /// buffers which belong to that Field in the current RecordBatch. + /// + /// For example, the schema + /// col1: Struct + /// col2: Utf8View + /// contains two Fields with variadic buffers so variadicBufferCounts will have + /// two entries, the first counting the variadic buffers of `col1.beta` and the + /// second counting `col2`'s. + /// + /// This field may be omitted if and only if the schema contains no Fields with + /// a variable number of buffers, such as BinaryView and Utf8View. + variadicBufferCounts: [long]; +} + +/// For sending dictionary encoding information. Any Field can be +/// dictionary-encoded, but in this case none of its children may be +/// dictionary-encoded. +/// There is one vector / column per dictionary, but that vector / column +/// may be spread across multiple dictionary batches by using the isDelta +/// flag + +table DictionaryBatch { + id: long; + data: RecordBatch; + + /// If isDelta is true the values in the dictionary are to be appended to a + /// dictionary with the indicated id. If isDelta is false this dictionary + /// should replace the existing dictionary. + isDelta: bool = false; +} + +/// ---------------------------------------------------------------------- +/// The root Message type + +/// This union enables us to easily send different message types without +/// redundant storage, and in the future we can easily add new message types. +/// +/// Arrow implementations do not need to implement all of the message types, +/// which may include experimental metadata types. 
For maximum compatibility, +/// it is best to send data using RecordBatch +union MessageHeader { + Schema +} + +table Message { + version: cudf.io.parquet.flatbuf.MetadataVersion; + header: MessageHeader; + bodyLength: long; + custom_metadata: [ KeyValue ]; +} + +root_type Message; diff --git a/cpp/include/cudf/io/ipc/Schema.fbs b/cpp/include/cudf/io/ipc/Schema.fbs new file mode 100644 index 00000000000..8479785b261 --- /dev/null +++ b/cpp/include/cudf/io/ipc/Schema.fbs @@ -0,0 +1,570 @@ +// Licensed to the Apache Software Foundation (ASF) under one +// or more contributor license agreements. See the NOTICE file +// distributed with this work for additional information +// regarding copyright ownership. The ASF licenses this file +// to you under the Apache License, Version 2.0 (the +// "License"); you may not use this file except in compliance +// with the License. You may obtain a copy of the License at +// +// http://www.apache.org/licenses/LICENSE-2.0 +// +// Unless required by applicable law or agreed to in writing, +// software distributed under the License is distributed on an +// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +// KIND, either express or implied. See the License for the +// specific language governing permissions and limitations +// under the License. + +/// Logical types, vector layouts, and schemas + +/// Format Version History. +/// Version 1.0 - Forward and backwards compatibility guaranteed. +/// Version 1.1 - Add Decimal256. +/// Version 1.2 - Add Interval MONTH_DAY_NANO. +/// Version 1.3 - Add Run-End Encoded. +/// Version 1.4 - Add BinaryView, Utf8View, variadicBufferCounts, ListView, and +/// LargeListView. + +namespace cudf.io.parquet.flatbuf; + +enum MetadataVersion:short { + /// 0.1.0 (October 2016). + V1, + + /// 0.2.0 (February 2017). Non-backwards compatible with V1. + V2, + + /// 0.3.0 -> 0.7.1 (May - December 2017). Non-backwards compatible with V2. + V3, + + /// >= 0.8.0 (December 2017). Non-backwards compatible with V3. + V4, + + /// >= 1.0.0 (July 2020). Backwards compatible with V4 (V5 readers can read V4 + /// metadata and IPC messages). Implementations are recommended to provide a + /// V4 compatibility mode with V5 format changes disabled. + /// + /// Incompatible changes between V4 and V5: + /// - Union buffer layout has changed. In V5, Unions don't have a validity + /// bitmap buffer. + V5, +} + +/// Represents Arrow Features that might not have full support +/// within implementations. This is intended to be used in +/// two scenarios: +/// 1. A mechanism for readers of Arrow Streams +/// and files to understand that the stream or file makes +/// use of a feature that isn't supported or unknown to +/// the implementation (and therefore can meet the Arrow +/// forward compatibility guarantees). +/// 2. A means of negotiating between a client and server +/// what features a stream is allowed to use. The enums +/// values here are intented to represent higher level +/// features, additional details maybe negotiated +/// with key-value pairs specific to the protocol. +/// +/// Enums added to this list should be assigned power-of-two values +/// to facilitate exchanging and comparing bitmaps for supported +/// features. +enum Feature : long { + /// Needed to make flatbuffers happy. + UNUSED = 0, + /// The stream makes use of multiple full dictionaries with the + /// same ID and assumes clients implement dictionary replacement + /// correctly. 
+ DICTIONARY_REPLACEMENT = 1, + /// The stream makes use of compressed bodies as described + /// in Message.fbs. + COMPRESSED_BODY = 2 +} + +/// These are stored in the flatbuffer in the Type union below + +table Null { +} + +/// A Struct_ in the flatbuffer metadata is the same as an Arrow Struct +/// (according to the physical memory layout). We used Struct_ here as +/// Struct is a reserved word in Flatbuffers +table Struct_ { +} + +table List { +} + +/// Same as List, but with 64-bit offsets, allowing to represent +/// extremely large data values. +table LargeList { +} + +/// Represents the same logical types that List can, but contains offsets and +/// sizes allowing for writes in any order and sharing of child values among +/// list values. +table ListView { +} + +/// Same as ListView, but with 64-bit offsets and sizes, allowing to represent +/// extremely large data values. +table LargeListView { +} + +table FixedSizeList { + /// Number of list items per value + listSize: int; +} + +/// A Map is a logical nested type that is represented as +/// +/// List> +/// +/// In this layout, the keys and values are each respectively contiguous. We do +/// not constrain the key and value types, so the application is responsible +/// for ensuring that the keys are hashable and unique. Whether the keys are sorted +/// may be set in the metadata for this field. +/// +/// In a field with Map type, the field has a child Struct field, which then +/// has two children: key type and the second the value type. The names of the +/// child fields may be respectively "entries", "key", and "value", but this is +/// not enforced. +/// +/// Map +/// ```text +/// - child[0] entries: Struct +/// - child[0] key: K +/// - child[1] value: V +/// ``` +/// Neither the "entries" field nor the "key" field may be nullable. +/// +/// The metadata is structured so that Arrow systems without special handling +/// for Map can make Map an alias for List. The "layout" attribute for the Map +/// field must have the same contents as a List. +table Map { + /// Set to true if the keys within each value are sorted + keysSorted: bool; +} + +enum UnionMode:short { Sparse, Dense } + +/// A union is a complex type with children in Field +/// By default ids in the type vector refer to the offsets in the children +/// optionally typeIds provides an indirection between the child offset and the type id +/// for each child `typeIds[offset]` is the id used in the type vector +table Union { + mode: UnionMode; + typeIds: [ int ]; // optional, describes typeid of each child. +} + +table Int { + bitWidth: int; // restricted to 8, 16, 32, and 64 in v1 + is_signed: bool; +} + +enum Precision:short {HALF, SINGLE, DOUBLE} + +table FloatingPoint { + precision: Precision; +} + +/// Unicode with UTF-8 encoding +table Utf8 { +} + +/// Opaque binary data +table Binary { +} + +/// Same as Utf8, but with 64-bit offsets, allowing to represent +/// extremely large data values. +table LargeUtf8 { +} + +/// Same as Binary, but with 64-bit offsets, allowing to represent +/// extremely large data values. +table LargeBinary { +} + +/// Logically the same as Utf8, but the internal representation uses a view +/// struct that contains the string length and either the string's entire data +/// inline (for small strings) or an inlined prefix, an index of another buffer, +/// and an offset pointing to a slice in that buffer (for non-small strings). 
+/// +/// Since it uses a variable number of data buffers, each Field with this type +/// must have a corresponding entry in `variadicBufferCounts`. +table Utf8View { +} + +/// Logically the same as Binary, but the internal representation uses a view +/// struct that contains the string length and either the string's entire data +/// inline (for small strings) or an inlined prefix, an index of another buffer, +/// and an offset pointing to a slice in that buffer (for non-small strings). +/// +/// Since it uses a variable number of data buffers, each Field with this type +/// must have a corresponding entry in `variadicBufferCounts`. +table BinaryView { +} + + +table FixedSizeBinary { + /// Number of bytes per value + byteWidth: int; +} + +table Bool { +} + +/// Contains two child arrays, run_ends and values. +/// The run_ends child array must be a 16/32/64-bit integer array +/// which encodes the indices at which the run with the value in +/// each corresponding index in the values child array ends. +/// Like list/struct types, the value array can be of any type. +table RunEndEncoded { +} + +/// Exact decimal value represented as an integer value in two's +/// complement. Currently only 128-bit (16-byte) and 256-bit (32-byte) integers +/// are used. The representation uses the endianness indicated +/// in the Schema. +table Decimal { + /// Total number of decimal digits + precision: int; + + /// Number of digits after the decimal point "." + scale: int; + + /// Number of bits per value. The only accepted widths are 128 and 256. + /// We use bitWidth for consistency with Int::bitWidth. + bitWidth: int = 128; +} + +enum DateUnit: short { + DAY, + MILLISECOND +} + +/// Date is either a 32-bit or 64-bit signed integer type representing an +/// elapsed time since UNIX epoch (1970-01-01), stored in either of two units: +/// +/// * Milliseconds (64 bits) indicating UNIX time elapsed since the epoch (no +/// leap seconds), where the values are evenly divisible by 86400000 +/// * Days (32 bits) since the UNIX epoch +table Date { + unit: DateUnit = MILLISECOND; +} + +enum TimeUnit: short { SECOND, MILLISECOND, MICROSECOND, NANOSECOND } + +/// Time is either a 32-bit or 64-bit signed integer type representing an +/// elapsed time since midnight, stored in either of four units: seconds, +/// milliseconds, microseconds or nanoseconds. +/// +/// The integer `bitWidth` depends on the `unit` and must be one of the following: +/// * SECOND and MILLISECOND: 32 bits +/// * MICROSECOND and NANOSECOND: 64 bits +/// +/// The allowed values are between 0 (inclusive) and 86400 (=24*60*60) seconds +/// (exclusive), adjusted for the time unit (for example, up to 86400000 +/// exclusive for the MILLISECOND unit). +/// This definition doesn't allow for leap seconds. Time values from +/// measurements with leap seconds will need to be corrected when ingesting +/// into Arrow (for example by replacing the value 86400 with 86399). +table Time { + unit: TimeUnit = MILLISECOND; + bitWidth: int = 32; +} + +/// Timestamp is a 64-bit signed integer representing an elapsed time since a +/// fixed epoch, stored in either of four units: seconds, milliseconds, +/// microseconds or nanoseconds, and is optionally annotated with a timezone. +/// +/// Timestamp values do not include any leap seconds (in other words, all +/// days are considered 86400 seconds long). 
+/// +/// Timestamps with a non-empty timezone +/// ------------------------------------ +/// +/// If a Timestamp column has a non-empty timezone value, its epoch is +/// 1970-01-01 00:00:00 (January 1st 1970, midnight) in the *UTC* timezone +/// (the Unix epoch), regardless of the Timestamp's own timezone. +/// +/// Therefore, timestamp values with a non-empty timezone correspond to +/// physical points in time together with some additional information about +/// how the data was obtained and/or how to display it (the timezone). +/// +/// For example, the timestamp value 0 with the timezone string "Europe/Paris" +/// corresponds to "January 1st 1970, 00h00" in the UTC timezone, but the +/// application may prefer to display it as "January 1st 1970, 01h00" in +/// the Europe/Paris timezone (which is the same physical point in time). +/// +/// One consequence is that timestamp values with a non-empty timezone +/// can be compared and ordered directly, since they all share the same +/// well-known point of reference (the Unix epoch). +/// +/// Timestamps with an unset / empty timezone +/// ----------------------------------------- +/// +/// If a Timestamp column has no timezone value, its epoch is +/// 1970-01-01 00:00:00 (January 1st 1970, midnight) in an *unknown* timezone. +/// +/// Therefore, timestamp values without a timezone cannot be meaningfully +/// interpreted as physical points in time, but only as calendar / clock +/// indications ("wall clock time") in an unspecified timezone. +/// +/// For example, the timestamp value 0 with an empty timezone string +/// corresponds to "January 1st 1970, 00h00" in an unknown timezone: there +/// is not enough information to interpret it as a well-defined physical +/// point in time. +/// +/// One consequence is that timestamp values without a timezone cannot +/// be reliably compared or ordered, since they may have different points of +/// reference. In particular, it is *not* possible to interpret an unset +/// or empty timezone as the same as "UTC". +/// +/// Conversion between timezones +/// ---------------------------- +/// +/// If a Timestamp column has a non-empty timezone, changing the timezone +/// to a different non-empty value is a metadata-only operation: +/// the timestamp values need not change as their point of reference remains +/// the same (the Unix epoch). +/// +/// However, if a Timestamp column has no timezone value, changing it to a +/// non-empty value requires to think about the desired semantics. +/// One possibility is to assume that the original timestamp values are +/// relative to the epoch of the timezone being set; timestamp values should +/// then adjusted to the Unix epoch (for example, changing the timezone from +/// empty to "Europe/Paris" would require converting the timestamp values +/// from "Europe/Paris" to "UTC", which seems counter-intuitive but is +/// nevertheless correct). +/// +/// Guidelines for encoding data from external libraries +/// ---------------------------------------------------- +/// +/// Date & time libraries often have multiple different data types for temporal +/// data. In order to ease interoperability between different implementations the +/// Arrow project has some recommendations for encoding these types into a Timestamp +/// column. +/// +/// An "instant" represents a physical point in time that has no relevant timezone +/// (for example, astronomical data). 
To encode an instant, use a Timestamp with +/// the timezone string set to "UTC", and make sure the Timestamp values +/// are relative to the UTC epoch (January 1st 1970, midnight). +/// +/// A "zoned date-time" represents a physical point in time annotated with an +/// informative timezone (for example, the timezone in which the data was +/// recorded). To encode a zoned date-time, use a Timestamp with the timezone +/// string set to the name of the timezone, and make sure the Timestamp values +/// are relative to the UTC epoch (January 1st 1970, midnight). +/// +/// (There is some ambiguity between an instant and a zoned date-time with the +/// UTC timezone. Both of these are stored the same in Arrow. Typically, +/// this distinction does not matter. If it does, then an application should +/// use custom metadata or an extension type to distinguish between the two cases.) +/// +/// An "offset date-time" represents a physical point in time combined with an +/// explicit offset from UTC. To encode an offset date-time, use a Timestamp +/// with the timezone string set to the numeric timezone offset string +/// (e.g. "+03:00"), and make sure the Timestamp values are relative to +/// the UTC epoch (January 1st 1970, midnight). +/// +/// A "naive date-time" (also called "local date-time" in some libraries) +/// represents a wall clock time combined with a calendar date, but with +/// no indication of how to map this information to a physical point in time. +/// Naive date-times must be handled with care because of this missing +/// information, and also because daylight saving time (DST) may make +/// some values ambiguous or nonexistent. A naive date-time may be +/// stored as a struct with Date and Time fields. However, it may also be +/// encoded into a Timestamp column with an empty timezone. The timestamp +/// values should be computed "as if" the timezone of the date-time values +/// was UTC; for example, the naive date-time "January 1st 1970, 00h00" would +/// be encoded as timestamp value 0. +table Timestamp { + unit: TimeUnit; + + /// The timezone is an optional string indicating the name of a timezone, + /// one of: + /// + /// * As used in the Olson timezone database (the "tz database" or + /// "tzdata"), such as "America/New_York". + /// * An absolute timezone offset of the form "+XX:XX" or "-XX:XX", + /// such as "+07:30". + /// + /// Whether a timezone string is present indicates different semantics about + /// the data (see above). + timezone: string; +} + +enum IntervalUnit: short { YEAR_MONTH, DAY_TIME, MONTH_DAY_NANO} +// A "calendar" interval which models types that don't necessarily +// have a precise duration without the context of a base timestamp (e.g. +// days can differ in length during day light savings time transitions). +// All integers in the types below are stored in the endianness indicated +// by the schema. +// +// YEAR_MONTH - Indicates the number of elapsed whole months, stored as +// 4-byte signed integers. +// DAY_TIME - Indicates the number of elapsed days and milliseconds (no leap seconds), +// stored as 2 contiguous 32-bit signed integers (8-bytes in total). Support +// of this IntervalUnit is not required for full arrow compatibility. +// MONTH_DAY_NANO - A triple of the number of elapsed months, days, and nanoseconds. +// The values are stored contiguously in 16-byte blocks. Months and days are +// encoded as 32-bit signed integers and nanoseconds is encoded as a 64-bit +// signed integer. Nanoseconds does not allow for leap seconds. 
Each field is +// independent (e.g. there is no constraint that nanoseconds have the same +// sign as days or that the quantity of nanoseconds represents less than a +// day's worth of time). +table Interval { + unit: IntervalUnit; +} + +// An absolute length of time unrelated to any calendar artifacts. +// +// For the purposes of Arrow Implementations, adding this value to a Timestamp +// ("t1") naively (i.e. simply summing the two number) is acceptable even +// though in some cases the resulting Timestamp (t2) would not account for +// leap-seconds during the elapsed time between "t1" and "t2". Similarly, +// representing the difference between two Unix timestamp is acceptable, but +// would yield a value that is possibly a few seconds off from the true elapsed +// time. +// +// The resolution defaults to millisecond, but can be any of the other +// supported TimeUnit values as with Timestamp and Time types. This type is +// always represented as an 8-byte integer. +table Duration { + unit: TimeUnit = MILLISECOND; +} + +/// ---------------------------------------------------------------------- +/// Top-level Type value, enabling extensible type-specific metadata. We can +/// add new logical types to Type without breaking backwards compatibility + +union Type { + Null, + Int, + FloatingPoint, + Binary, + Utf8, + Bool, + Decimal, + Date, + Time, + Timestamp, + Interval, + List, + Struct_, + Union, + FixedSizeBinary, + FixedSizeList, + Map, + Duration, + LargeBinary, + LargeUtf8, + LargeList, + RunEndEncoded, + BinaryView, + Utf8View, + ListView, + LargeListView, +} + +/// ---------------------------------------------------------------------- +/// user defined key value pairs to add custom metadata to arrow +/// key namespacing is the responsibility of the user + +table KeyValue { + key: string; + value: string; +} + +/// ---------------------------------------------------------------------- +/// Dictionary encoding metadata +/// Maintained for forwards compatibility, in the future +/// Dictionaries might be explicit maps between integers and values +/// allowing for non-contiguous index values +enum DictionaryKind : short { DenseArray } +table DictionaryEncoding { + /// The known dictionary id in the application where this data is used. In + /// the file or streaming formats, the dictionary ids are found in the + /// DictionaryBatch messages + id: long; + + /// The dictionary indices are constrained to be non-negative integers. If + /// this field is null, the indices must be signed int32. To maximize + /// cross-language compatibility and performance, implementations are + /// recommended to prefer signed integer types over unsigned integer types + /// and to avoid uint64 indices unless they are required by an application. + indexType: Int; + + /// By default, dictionaries are not ordered, or the order does not have + /// semantic meaning. In some statistical, applications, dictionary-encoding + /// is used to represent ordered categorical data, and we provide a way to + /// preserve that metadata here + isOrdered: bool; + + dictionaryKind: DictionaryKind; +} + +/// ---------------------------------------------------------------------- +/// A field represents a named column in a record / row batch or child of a +/// nested type. + +table Field { + /// Name is not required, in i.e. a List + name: string; + + /// Whether or not this field can contain nulls. Should be true in general. + nullable: bool; + + /// This is the type of the decoded value if the field is dictionary encoded. 
+ type: Type; + + /// Present only if the field is dictionary encoded. + dictionary: DictionaryEncoding; + + /// children apply only to nested data types like Struct, List and Union. For + /// primitive types children will have length 0. + children: [ Field ]; + + /// User-defined metadata + custom_metadata: [ KeyValue ]; +} + +/// ---------------------------------------------------------------------- +/// Endianness of the platform producing the data + +enum Endianness:short { Little, Big } + +/// ---------------------------------------------------------------------- +/// A Buffer represents a single contiguous memory segment +struct Buffer { + /// The relative offset into the shared memory page where the bytes for this + /// buffer starts + offset: long; + + /// The absolute length (in bytes) of the memory buffer. The memory is found + /// from offset (inclusive) to offset + length (non-inclusive). When building + /// messages using the encapsulated IPC message, padding bytes may be written + /// after a buffer, but such padding bytes do not need to be accounted for in + /// the size here. + length: long; +} + +/// ---------------------------------------------------------------------- +/// A Schema describes the columns in a row batch + +table Schema { + + /// endianness of the buffer + /// it is Little Endian by default + /// if endianness doesn't match the underlying system then the vectors need to be converted + endianness: Endianness=Little; + + fields: [Field]; + // User-defined metadata + custom_metadata: [ KeyValue ]; + + /// Features used in the stream/file. + features : [ Feature ]; +} + +root_type Schema; diff --git a/cpp/include/cudf/io/ipc/detail/Message_generated.h b/cpp/include/cudf/io/ipc/detail/Message_generated.h new file mode 100644 index 00000000000..1cede9a963d --- /dev/null +++ b/cpp/include/cudf/io/ipc/detail/Message_generated.h @@ -0,0 +1,651 @@ +// automatically generated by the FlatBuffers compiler, do not modify + +#ifndef FLATBUFFERS_GENERATED_MESSAGE_CUDF_IO_PARQUET_FLATBUF_H_ +#define FLATBUFFERS_GENERATED_MESSAGE_CUDF_IO_PARQUET_FLATBUF_H_ + +#include + +// Ensure the included flatbuffers.h is the same version as when this file was +// generated, otherwise it may not be compatible. 
+static_assert(FLATBUFFERS_VERSION_MAJOR == 24 && FLATBUFFERS_VERSION_MINOR == 3 && + FLATBUFFERS_VERSION_REVISION == 25, + "Non-compatible flatbuffers version included"); + +#include + +namespace cudf { +namespace io { +namespace parquet { +namespace flatbuf { + +struct FieldNode; + +struct BodyCompression; +struct BodyCompressionBuilder; + +struct RecordBatch; +struct RecordBatchBuilder; + +struct DictionaryBatch; +struct DictionaryBatchBuilder; + +struct Message; +struct MessageBuilder; + +enum CompressionType : int8_t { + CompressionType_LZ4_FRAME = 0, + CompressionType_ZSTD = 1, + CompressionType_MIN = CompressionType_LZ4_FRAME, + CompressionType_MAX = CompressionType_ZSTD +}; + +inline const CompressionType (&EnumValuesCompressionType())[2] +{ + static const CompressionType values[] = {CompressionType_LZ4_FRAME, CompressionType_ZSTD}; + return values; +} + +inline const char* const* EnumNamesCompressionType() +{ + static const char* const names[3] = {"LZ4_FRAME", "ZSTD", nullptr}; + return names; +} + +inline const char* EnumNameCompressionType(CompressionType e) +{ + if (::flatbuffers::IsOutRange(e, CompressionType_LZ4_FRAME, CompressionType_ZSTD)) return ""; + const size_t index = static_cast(e); + return EnumNamesCompressionType()[index]; +} + +/// Provided for forward compatibility in case we need to support different +/// strategies for compressing the IPC message body (like whole-body +/// compression rather than buffer-level) in the future +enum BodyCompressionMethod : int8_t { + /// Each constituent buffer is first compressed with the indicated + /// compressor, and then written with the uncompressed length in the first 8 + /// bytes as a 64-bit little-endian signed integer followed by the compressed + /// buffer bytes (and then padding as required by the protocol). The + /// uncompressed length may be set to -1 to indicate that the data that + /// follows is not compressed, which can be useful for cases where + /// compression does not yield appreciable savings. + BodyCompressionMethod_BUFFER = 0, + BodyCompressionMethod_MIN = BodyCompressionMethod_BUFFER, + BodyCompressionMethod_MAX = BodyCompressionMethod_BUFFER +}; + +inline const BodyCompressionMethod (&EnumValuesBodyCompressionMethod())[1] +{ + static const BodyCompressionMethod values[] = {BodyCompressionMethod_BUFFER}; + return values; +} + +inline const char* const* EnumNamesBodyCompressionMethod() +{ + static const char* const names[2] = {"BUFFER", nullptr}; + return names; +} + +inline const char* EnumNameBodyCompressionMethod(BodyCompressionMethod e) +{ + if (::flatbuffers::IsOutRange(e, BodyCompressionMethod_BUFFER, BodyCompressionMethod_BUFFER)) + return ""; + const size_t index = static_cast(e); + return EnumNamesBodyCompressionMethod()[index]; +} + +/// ---------------------------------------------------------------------- +/// The root Message type +/// This union enables us to easily send different message types without +/// redundant storage, and in the future we can easily add new message types. +/// +/// Arrow implementations do not need to implement all of the message types, +/// which may include experimental metadata types. 
For maximum compatibility, +/// it is best to send data using RecordBatch +enum MessageHeader : uint8_t { + MessageHeader_NONE = 0, + MessageHeader_Schema = 1, + MessageHeader_MIN = MessageHeader_NONE, + MessageHeader_MAX = MessageHeader_Schema +}; + +inline const MessageHeader (&EnumValuesMessageHeader())[2] +{ + static const MessageHeader values[] = {MessageHeader_NONE, MessageHeader_Schema}; + return values; +} + +inline const char* const* EnumNamesMessageHeader() +{ + static const char* const names[3] = {"NONE", "Schema", nullptr}; + return names; +} + +inline const char* EnumNameMessageHeader(MessageHeader e) +{ + if (::flatbuffers::IsOutRange(e, MessageHeader_NONE, MessageHeader_Schema)) return ""; + const size_t index = static_cast(e); + return EnumNamesMessageHeader()[index]; +} + +template +struct MessageHeaderTraits { + static const MessageHeader enum_value = MessageHeader_NONE; +}; + +template <> +struct MessageHeaderTraits { + static const MessageHeader enum_value = MessageHeader_Schema; +}; + +bool VerifyMessageHeader(::flatbuffers::Verifier& verifier, const void* obj, MessageHeader type); +bool VerifyMessageHeaderVector(::flatbuffers::Verifier& verifier, + const ::flatbuffers::Vector<::flatbuffers::Offset>* values, + const ::flatbuffers::Vector* types); + +/// ---------------------------------------------------------------------- +/// Data structures for describing a table row batch (a collection of +/// equal-length Arrow arrays) +/// Metadata about a field at some level of a nested type tree (but not +/// its children). +/// +/// For example, a List with values `[[1, 2, 3], null, [4], [5, 6], null]` +/// would have {length: 5, null_count: 2} for its List node, and {length: 6, +/// null_count: 0} for its Int16 node, as separate FieldNode structs +FLATBUFFERS_MANUALLY_ALIGNED_STRUCT(8) FieldNode FLATBUFFERS_FINAL_CLASS +{ + private: + int64_t length_; + int64_t null_count_; + + public: + FieldNode() : length_(0), null_count_(0) {} + FieldNode(int64_t _length, int64_t _null_count) + : length_(::flatbuffers::EndianScalar(_length)), + null_count_(::flatbuffers::EndianScalar(_null_count)) + { + } + /// The number of value slots in the Arrow array at this level of a nested + /// tree + int64_t length() const { return ::flatbuffers::EndianScalar(length_); } + /// The number of observed nulls. Fields with null_count == 0 may choose not + /// to write their physical validity bitmap out as a materialized buffer, + /// instead setting the length of the bitmap buffer to 0. + int64_t null_count() const { return ::flatbuffers::EndianScalar(null_count_); } +}; +FLATBUFFERS_STRUCT_END(FieldNode, 16); + +/// Optional compression for the memory buffers constituting IPC message +/// bodies. Intended for use with RecordBatch but could be used for other +/// message types +struct BodyCompression FLATBUFFERS_FINAL_CLASS : private ::flatbuffers::Table { + typedef BodyCompressionBuilder Builder; + enum FlatBuffersVTableOffset FLATBUFFERS_VTABLE_UNDERLYING_TYPE { VT_CODEC = 4, VT_METHOD = 6 }; + /// Compressor library. + /// For LZ4_FRAME, each compressed buffer must consist of a single frame. 
+ cudf::io::parquet::flatbuf::CompressionType codec() const + { + return static_cast(GetField(VT_CODEC, 0)); + } + /// Indicates the way the record batch body was compressed + cudf::io::parquet::flatbuf::BodyCompressionMethod method() const + { + return static_cast( + GetField(VT_METHOD, 0)); + } + bool Verify(::flatbuffers::Verifier& verifier) const + { + return VerifyTableStart(verifier) && VerifyField(verifier, VT_CODEC, 1) && + VerifyField(verifier, VT_METHOD, 1) && verifier.EndTable(); + } +}; + +struct BodyCompressionBuilder { + typedef BodyCompression Table; + ::flatbuffers::FlatBufferBuilder& fbb_; + ::flatbuffers::uoffset_t start_; + void add_codec(cudf::io::parquet::flatbuf::CompressionType codec) + { + fbb_.AddElement(BodyCompression::VT_CODEC, static_cast(codec), 0); + } + void add_method(cudf::io::parquet::flatbuf::BodyCompressionMethod method) + { + fbb_.AddElement(BodyCompression::VT_METHOD, static_cast(method), 0); + } + explicit BodyCompressionBuilder(::flatbuffers::FlatBufferBuilder& _fbb) : fbb_(_fbb) + { + start_ = fbb_.StartTable(); + } + ::flatbuffers::Offset Finish() + { + const auto end = fbb_.EndTable(start_); + auto o = ::flatbuffers::Offset(end); + return o; + } +}; + +inline ::flatbuffers::Offset CreateBodyCompression( + ::flatbuffers::FlatBufferBuilder& _fbb, + cudf::io::parquet::flatbuf::CompressionType codec = + cudf::io::parquet::flatbuf::CompressionType_LZ4_FRAME, + cudf::io::parquet::flatbuf::BodyCompressionMethod method = + cudf::io::parquet::flatbuf::BodyCompressionMethod_BUFFER) +{ + BodyCompressionBuilder builder_(_fbb); + builder_.add_method(method); + builder_.add_codec(codec); + return builder_.Finish(); +} + +/// A data header describing the shared memory layout of a "record" or "row" +/// batch. Some systems call this a "row batch" internally and others a "record +/// batch". +struct RecordBatch FLATBUFFERS_FINAL_CLASS : private ::flatbuffers::Table { + typedef RecordBatchBuilder Builder; + enum FlatBuffersVTableOffset FLATBUFFERS_VTABLE_UNDERLYING_TYPE { + VT_LENGTH = 4, + VT_NODES = 6, + VT_BUFFERS = 8, + VT_COMPRESSION = 10, + VT_VARIADICBUFFERCOUNTS = 12 + }; + /// number of records / rows. The arrays in the batch should all have this + /// length + int64_t length() const { return GetField(VT_LENGTH, 0); } + /// Nodes correspond to the pre-ordered flattened logical schema + const ::flatbuffers::Vector* nodes() const + { + return GetPointer*>( + VT_NODES); + } + /// Buffers correspond to the pre-ordered flattened buffer tree + /// + /// The number of buffers appended to this list depends on the schema. For + /// example, most primitive arrays will have 2 buffers, 1 for the validity + /// bitmap and 1 for the values. For struct arrays, there will only be a + /// single buffer for the validity (nulls) bitmap + const ::flatbuffers::Vector* buffers() const + { + return GetPointer*>( + VT_BUFFERS); + } + /// Optional compression of the message body + const cudf::io::parquet::flatbuf::BodyCompression* compression() const + { + return GetPointer(VT_COMPRESSION); + } + /// Some types such as Utf8View are represented using a variable number of buffers. + /// For each such Field in the pre-ordered flattened logical schema, there will be + /// an entry in variadicBufferCounts to indicate the number of number of variadic + /// buffers which belong to that Field in the current RecordBatch. 
+ /// + /// For example, the schema + /// col1: Struct + /// col2: Utf8View + /// contains two Fields with variadic buffers so variadicBufferCounts will have + /// two entries, the first counting the variadic buffers of `col1.beta` and the + /// second counting `col2`'s. + /// + /// This field may be omitted if and only if the schema contains no Fields with + /// a variable number of buffers, such as BinaryView and Utf8View. + const ::flatbuffers::Vector* variadicBufferCounts() const + { + return GetPointer*>(VT_VARIADICBUFFERCOUNTS); + } + bool Verify(::flatbuffers::Verifier& verifier) const + { + return VerifyTableStart(verifier) && VerifyField(verifier, VT_LENGTH, 8) && + VerifyOffset(verifier, VT_NODES) && verifier.VerifyVector(nodes()) && + VerifyOffset(verifier, VT_BUFFERS) && verifier.VerifyVector(buffers()) && + VerifyOffset(verifier, VT_COMPRESSION) && verifier.VerifyTable(compression()) && + VerifyOffset(verifier, VT_VARIADICBUFFERCOUNTS) && + verifier.VerifyVector(variadicBufferCounts()) && verifier.EndTable(); + } +}; + +struct RecordBatchBuilder { + typedef RecordBatch Table; + ::flatbuffers::FlatBufferBuilder& fbb_; + ::flatbuffers::uoffset_t start_; + void add_length(int64_t length) { fbb_.AddElement(RecordBatch::VT_LENGTH, length, 0); } + void add_nodes( + ::flatbuffers::Offset<::flatbuffers::Vector> + nodes) + { + fbb_.AddOffset(RecordBatch::VT_NODES, nodes); + } + void add_buffers( + ::flatbuffers::Offset<::flatbuffers::Vector> buffers) + { + fbb_.AddOffset(RecordBatch::VT_BUFFERS, buffers); + } + void add_compression( + ::flatbuffers::Offset compression) + { + fbb_.AddOffset(RecordBatch::VT_COMPRESSION, compression); + } + void add_variadicBufferCounts( + ::flatbuffers::Offset<::flatbuffers::Vector> variadicBufferCounts) + { + fbb_.AddOffset(RecordBatch::VT_VARIADICBUFFERCOUNTS, variadicBufferCounts); + } + explicit RecordBatchBuilder(::flatbuffers::FlatBufferBuilder& _fbb) : fbb_(_fbb) + { + start_ = fbb_.StartTable(); + } + ::flatbuffers::Offset Finish() + { + const auto end = fbb_.EndTable(start_); + auto o = ::flatbuffers::Offset(end); + return o; + } +}; + +inline ::flatbuffers::Offset CreateRecordBatch( + ::flatbuffers::FlatBufferBuilder& _fbb, + int64_t length = 0, + ::flatbuffers::Offset<::flatbuffers::Vector> nodes = + 0, + ::flatbuffers::Offset<::flatbuffers::Vector> buffers = + 0, + ::flatbuffers::Offset compression = 0, + ::flatbuffers::Offset<::flatbuffers::Vector> variadicBufferCounts = 0) +{ + RecordBatchBuilder builder_(_fbb); + builder_.add_length(length); + builder_.add_variadicBufferCounts(variadicBufferCounts); + builder_.add_compression(compression); + builder_.add_buffers(buffers); + builder_.add_nodes(nodes); + return builder_.Finish(); +} + +inline ::flatbuffers::Offset CreateRecordBatchDirect( + ::flatbuffers::FlatBufferBuilder& _fbb, + int64_t length = 0, + const std::vector* nodes = nullptr, + const std::vector* buffers = nullptr, + ::flatbuffers::Offset compression = 0, + const std::vector* variadicBufferCounts = nullptr) +{ + auto nodes__ = + nodes ? _fbb.CreateVectorOfStructs(*nodes) : 0; + auto buffers__ = + buffers ? _fbb.CreateVectorOfStructs(*buffers) : 0; + auto variadicBufferCounts__ = + variadicBufferCounts ? _fbb.CreateVector(*variadicBufferCounts) : 0; + return cudf::io::parquet::flatbuf::CreateRecordBatch( + _fbb, length, nodes__, buffers__, compression, variadicBufferCounts__); +} + +/// For sending dictionary encoding information. 
Any Field can be +/// dictionary-encoded, but in this case none of its children may be +/// dictionary-encoded. +/// There is one vector / column per dictionary, but that vector / column +/// may be spread across multiple dictionary batches by using the isDelta +/// flag +struct DictionaryBatch FLATBUFFERS_FINAL_CLASS : private ::flatbuffers::Table { + typedef DictionaryBatchBuilder Builder; + enum FlatBuffersVTableOffset FLATBUFFERS_VTABLE_UNDERLYING_TYPE { + VT_ID = 4, + VT_DATA = 6, + VT_ISDELTA = 8 + }; + int64_t id() const { return GetField(VT_ID, 0); } + const cudf::io::parquet::flatbuf::RecordBatch* data() const + { + return GetPointer(VT_DATA); + } + /// If isDelta is true the values in the dictionary are to be appended to a + /// dictionary with the indicated id. If isDelta is false this dictionary + /// should replace the existing dictionary. + bool isDelta() const { return GetField(VT_ISDELTA, 0) != 0; } + bool Verify(::flatbuffers::Verifier& verifier) const + { + return VerifyTableStart(verifier) && VerifyField(verifier, VT_ID, 8) && + VerifyOffset(verifier, VT_DATA) && verifier.VerifyTable(data()) && + VerifyField(verifier, VT_ISDELTA, 1) && verifier.EndTable(); + } +}; + +struct DictionaryBatchBuilder { + typedef DictionaryBatch Table; + ::flatbuffers::FlatBufferBuilder& fbb_; + ::flatbuffers::uoffset_t start_; + void add_id(int64_t id) { fbb_.AddElement(DictionaryBatch::VT_ID, id, 0); } + void add_data(::flatbuffers::Offset data) + { + fbb_.AddOffset(DictionaryBatch::VT_DATA, data); + } + void add_isDelta(bool isDelta) + { + fbb_.AddElement(DictionaryBatch::VT_ISDELTA, static_cast(isDelta), 0); + } + explicit DictionaryBatchBuilder(::flatbuffers::FlatBufferBuilder& _fbb) : fbb_(_fbb) + { + start_ = fbb_.StartTable(); + } + ::flatbuffers::Offset Finish() + { + const auto end = fbb_.EndTable(start_); + auto o = ::flatbuffers::Offset(end); + return o; + } +}; + +inline ::flatbuffers::Offset CreateDictionaryBatch( + ::flatbuffers::FlatBufferBuilder& _fbb, + int64_t id = 0, + ::flatbuffers::Offset data = 0, + bool isDelta = false) +{ + DictionaryBatchBuilder builder_(_fbb); + builder_.add_id(id); + builder_.add_data(data); + builder_.add_isDelta(isDelta); + return builder_.Finish(); +} + +struct Message FLATBUFFERS_FINAL_CLASS : private ::flatbuffers::Table { + typedef MessageBuilder Builder; + enum FlatBuffersVTableOffset FLATBUFFERS_VTABLE_UNDERLYING_TYPE { + VT_VERSION = 4, + VT_HEADER_TYPE = 6, + VT_HEADER = 8, + VT_BODYLENGTH = 10, + VT_CUSTOM_METADATA = 12 + }; + cudf::io::parquet::flatbuf::MetadataVersion version() const + { + return static_cast( + GetField(VT_VERSION, 0)); + } + cudf::io::parquet::flatbuf::MessageHeader header_type() const + { + return static_cast( + GetField(VT_HEADER_TYPE, 0)); + } + const void* header() const { return GetPointer(VT_HEADER); } + template + const T* header_as() const; + const cudf::io::parquet::flatbuf::Schema* header_as_Schema() const + { + return header_type() == cudf::io::parquet::flatbuf::MessageHeader_Schema + ? 
static_cast(header()) + : nullptr; + } + int64_t bodyLength() const { return GetField(VT_BODYLENGTH, 0); } + const ::flatbuffers::Vector<::flatbuffers::Offset>* + custom_metadata() const + { + return GetPointer< + const ::flatbuffers::Vector<::flatbuffers::Offset>*>( + VT_CUSTOM_METADATA); + } + bool Verify(::flatbuffers::Verifier& verifier) const + { + return VerifyTableStart(verifier) && VerifyField(verifier, VT_VERSION, 2) && + VerifyField(verifier, VT_HEADER_TYPE, 1) && VerifyOffset(verifier, VT_HEADER) && + VerifyMessageHeader(verifier, header(), header_type()) && + VerifyField(verifier, VT_BODYLENGTH, 8) && + VerifyOffset(verifier, VT_CUSTOM_METADATA) && verifier.VerifyVector(custom_metadata()) && + verifier.VerifyVectorOfTables(custom_metadata()) && verifier.EndTable(); + } +}; + +template <> +inline const cudf::io::parquet::flatbuf::Schema* +Message::header_as() const +{ + return header_as_Schema(); +} + +struct MessageBuilder { + typedef Message Table; + ::flatbuffers::FlatBufferBuilder& fbb_; + ::flatbuffers::uoffset_t start_; + void add_version(cudf::io::parquet::flatbuf::MetadataVersion version) + { + fbb_.AddElement(Message::VT_VERSION, static_cast(version), 0); + } + void add_header_type(cudf::io::parquet::flatbuf::MessageHeader header_type) + { + fbb_.AddElement(Message::VT_HEADER_TYPE, static_cast(header_type), 0); + } + void add_header(::flatbuffers::Offset header) + { + fbb_.AddOffset(Message::VT_HEADER, header); + } + void add_bodyLength(int64_t bodyLength) + { + fbb_.AddElement(Message::VT_BODYLENGTH, bodyLength, 0); + } + void add_custom_metadata( + ::flatbuffers::Offset< + ::flatbuffers::Vector<::flatbuffers::Offset>> + custom_metadata) + { + fbb_.AddOffset(Message::VT_CUSTOM_METADATA, custom_metadata); + } + explicit MessageBuilder(::flatbuffers::FlatBufferBuilder& _fbb) : fbb_(_fbb) + { + start_ = fbb_.StartTable(); + } + ::flatbuffers::Offset Finish() + { + const auto end = fbb_.EndTable(start_); + auto o = ::flatbuffers::Offset(end); + return o; + } +}; + +inline ::flatbuffers::Offset CreateMessage( + ::flatbuffers::FlatBufferBuilder& _fbb, + cudf::io::parquet::flatbuf::MetadataVersion version = + cudf::io::parquet::flatbuf::MetadataVersion_V1, + cudf::io::parquet::flatbuf::MessageHeader header_type = + cudf::io::parquet::flatbuf::MessageHeader_NONE, + ::flatbuffers::Offset header = 0, + int64_t bodyLength = 0, + ::flatbuffers::Offset<::flatbuffers::Vector< + ::flatbuffers::Offset>> custom_metadata = 0) +{ + MessageBuilder builder_(_fbb); + builder_.add_bodyLength(bodyLength); + builder_.add_custom_metadata(custom_metadata); + builder_.add_header(header); + builder_.add_version(version); + builder_.add_header_type(header_type); + return builder_.Finish(); +} + +inline ::flatbuffers::Offset CreateMessageDirect( + ::flatbuffers::FlatBufferBuilder& _fbb, + cudf::io::parquet::flatbuf::MetadataVersion version = + cudf::io::parquet::flatbuf::MetadataVersion_V1, + cudf::io::parquet::flatbuf::MessageHeader header_type = + cudf::io::parquet::flatbuf::MessageHeader_NONE, + ::flatbuffers::Offset header = 0, + int64_t bodyLength = 0, + const std::vector<::flatbuffers::Offset>* custom_metadata = + nullptr) +{ + auto custom_metadata__ = + custom_metadata + ? 
_fbb.CreateVector<::flatbuffers::Offset>( + *custom_metadata) + : 0; + return cudf::io::parquet::flatbuf::CreateMessage( + _fbb, version, header_type, header, bodyLength, custom_metadata__); +} + +inline bool VerifyMessageHeader(::flatbuffers::Verifier& verifier, + const void* obj, + MessageHeader type) +{ + switch (type) { + case MessageHeader_NONE: { + return true; + } + case MessageHeader_Schema: { + auto ptr = reinterpret_cast(obj); + return verifier.VerifyTable(ptr); + } + default: return true; + } +} + +inline bool VerifyMessageHeaderVector( + ::flatbuffers::Verifier& verifier, + const ::flatbuffers::Vector<::flatbuffers::Offset>* values, + const ::flatbuffers::Vector* types) +{ + if (!values || !types) return !values && !types; + if (values->size() != types->size()) return false; + for (::flatbuffers::uoffset_t i = 0; i < values->size(); ++i) { + if (!VerifyMessageHeader(verifier, values->Get(i), types->GetEnum(i))) { + return false; + } + } + return true; +} + +inline const cudf::io::parquet::flatbuf::Message* GetMessage(const void* buf) +{ + return ::flatbuffers::GetRoot(buf); +} + +inline const cudf::io::parquet::flatbuf::Message* GetSizePrefixedMessage(const void* buf) +{ + return ::flatbuffers::GetSizePrefixedRoot(buf); +} + +inline bool VerifyMessageBuffer(::flatbuffers::Verifier& verifier) +{ + return verifier.VerifyBuffer(nullptr); +} + +inline bool VerifySizePrefixedMessageBuffer(::flatbuffers::Verifier& verifier) +{ + return verifier.VerifySizePrefixedBuffer(nullptr); +} + +inline void FinishMessageBuffer(::flatbuffers::FlatBufferBuilder& fbb, + ::flatbuffers::Offset root) +{ + fbb.Finish(root); +} + +inline void FinishSizePrefixedMessageBuffer( + ::flatbuffers::FlatBufferBuilder& fbb, + ::flatbuffers::Offset root) +{ + fbb.FinishSizePrefixed(root); +} + +} // namespace flatbuf +} // namespace parquet +} // namespace io +} // namespace cudf + +#endif // FLATBUFFERS_GENERATED_MESSAGE_CUDF_IO_PARQUET_FLATBUF_H_ diff --git a/cpp/include/cudf/io/ipc/detail/Schema_generated.h b/cpp/include/cudf/io/ipc/detail/Schema_generated.h new file mode 100644 index 00000000000..4d662704604 --- /dev/null +++ b/cpp/include/cudf/io/ipc/detail/Schema_generated.h @@ -0,0 +1,2769 @@ +// automatically generated by the FlatBuffers compiler, do not modify + +#ifndef FLATBUFFERS_GENERATED_SCHEMA_CUDF_IO_PARQUET_FLATBUF_H_ +#define FLATBUFFERS_GENERATED_SCHEMA_CUDF_IO_PARQUET_FLATBUF_H_ + +#include + +// Ensure the included flatbuffers.h is the same version as when this file was +// generated, otherwise it may not be compatible. 
+static_assert(FLATBUFFERS_VERSION_MAJOR == 24 && FLATBUFFERS_VERSION_MINOR == 3 && + FLATBUFFERS_VERSION_REVISION == 25, + "Non-compatible flatbuffers version included"); + +namespace cudf { +namespace io { +namespace parquet { +namespace flatbuf { + +struct Null; +struct NullBuilder; + +struct Struct_; +struct Struct_Builder; + +struct List; +struct ListBuilder; + +struct LargeList; +struct LargeListBuilder; + +struct ListView; +struct ListViewBuilder; + +struct LargeListView; +struct LargeListViewBuilder; + +struct FixedSizeList; +struct FixedSizeListBuilder; + +struct Map; +struct MapBuilder; + +struct Union; +struct UnionBuilder; + +struct Int; +struct IntBuilder; + +struct FloatingPoint; +struct FloatingPointBuilder; + +struct Utf8; +struct Utf8Builder; + +struct Binary; +struct BinaryBuilder; + +struct LargeUtf8; +struct LargeUtf8Builder; + +struct LargeBinary; +struct LargeBinaryBuilder; + +struct Utf8View; +struct Utf8ViewBuilder; + +struct BinaryView; +struct BinaryViewBuilder; + +struct FixedSizeBinary; +struct FixedSizeBinaryBuilder; + +struct Bool; +struct BoolBuilder; + +struct RunEndEncoded; +struct RunEndEncodedBuilder; + +struct Decimal; +struct DecimalBuilder; + +struct Date; +struct DateBuilder; + +struct Time; +struct TimeBuilder; + +struct Timestamp; +struct TimestampBuilder; + +struct Interval; +struct IntervalBuilder; + +struct Duration; +struct DurationBuilder; + +struct KeyValue; +struct KeyValueBuilder; + +struct DictionaryEncoding; +struct DictionaryEncodingBuilder; + +struct Field; +struct FieldBuilder; + +struct Buffer; + +struct Schema; +struct SchemaBuilder; + +enum MetadataVersion : int16_t { + /// 0.1.0 (October 2016). + MetadataVersion_V1 = 0, + /// 0.2.0 (February 2017). Non-backwards compatible with V1. + MetadataVersion_V2 = 1, + /// 0.3.0 -> 0.7.1 (May - December 2017). Non-backwards compatible with V2. + MetadataVersion_V3 = 2, + /// >= 0.8.0 (December 2017). Non-backwards compatible with V3. + MetadataVersion_V4 = 3, + /// >= 1.0.0 (July 2020). Backwards compatible with V4 (V5 readers can read V4 + /// metadata and IPC messages). Implementations are recommended to provide a + /// V4 compatibility mode with V5 format changes disabled. + /// + /// Incompatible changes between V4 and V5: + /// - Union buffer layout has changed. In V5, Unions don't have a validity + /// bitmap buffer. + MetadataVersion_V5 = 4, + MetadataVersion_MIN = MetadataVersion_V1, + MetadataVersion_MAX = MetadataVersion_V5 +}; + +inline const MetadataVersion (&EnumValuesMetadataVersion())[5] +{ + static const MetadataVersion values[] = {MetadataVersion_V1, + MetadataVersion_V2, + MetadataVersion_V3, + MetadataVersion_V4, + MetadataVersion_V5}; + return values; +} + +inline const char* const* EnumNamesMetadataVersion() +{ + static const char* const names[6] = {"V1", "V2", "V3", "V4", "V5", nullptr}; + return names; +} + +inline const char* EnumNameMetadataVersion(MetadataVersion e) +{ + if (::flatbuffers::IsOutRange(e, MetadataVersion_V1, MetadataVersion_V5)) return ""; + const size_t index = static_cast(e); + return EnumNamesMetadataVersion()[index]; +} + +/// Represents Arrow Features that might not have full support +/// within implementations. This is intended to be used in +/// two scenarios: +/// 1. A mechanism for readers of Arrow Streams +/// and files to understand that the stream or file makes +/// use of a feature that isn't supported or unknown to +/// the implementation (and therefore can meet the Arrow +/// forward compatibility guarantees). +/// 2. 
A means of negotiating between a client and server +/// what features a stream is allowed to use. The enums +/// values here are intented to represent higher level +/// features, additional details maybe negotiated +/// with key-value pairs specific to the protocol. +/// +/// Enums added to this list should be assigned power-of-two values +/// to facilitate exchanging and comparing bitmaps for supported +/// features. +enum Feature : int64_t { + /// Needed to make flatbuffers happy. + Feature_UNUSED = 0, + /// The stream makes use of multiple full dictionaries with the + /// same ID and assumes clients implement dictionary replacement + /// correctly. + Feature_DICTIONARY_REPLACEMENT = 1LL, + /// The stream makes use of compressed bodies as described + /// in Message.fbs. + Feature_COMPRESSED_BODY = 2LL, + Feature_MIN = Feature_UNUSED, + Feature_MAX = Feature_COMPRESSED_BODY +}; + +inline const Feature (&EnumValuesFeature())[3] +{ + static const Feature values[] = { + Feature_UNUSED, Feature_DICTIONARY_REPLACEMENT, Feature_COMPRESSED_BODY}; + return values; +} + +inline const char* const* EnumNamesFeature() +{ + static const char* const names[4] = { + "UNUSED", "DICTIONARY_REPLACEMENT", "COMPRESSED_BODY", nullptr}; + return names; +} + +inline const char* EnumNameFeature(Feature e) +{ + if (::flatbuffers::IsOutRange(e, Feature_UNUSED, Feature_COMPRESSED_BODY)) return ""; + const size_t index = static_cast(e); + return EnumNamesFeature()[index]; +} + +enum UnionMode : int16_t { + UnionMode_Sparse = 0, + UnionMode_Dense = 1, + UnionMode_MIN = UnionMode_Sparse, + UnionMode_MAX = UnionMode_Dense +}; + +inline const UnionMode (&EnumValuesUnionMode())[2] +{ + static const UnionMode values[] = {UnionMode_Sparse, UnionMode_Dense}; + return values; +} + +inline const char* const* EnumNamesUnionMode() +{ + static const char* const names[3] = {"Sparse", "Dense", nullptr}; + return names; +} + +inline const char* EnumNameUnionMode(UnionMode e) +{ + if (::flatbuffers::IsOutRange(e, UnionMode_Sparse, UnionMode_Dense)) return ""; + const size_t index = static_cast(e); + return EnumNamesUnionMode()[index]; +} + +enum Precision : int16_t { + Precision_HALF = 0, + Precision_SINGLE = 1, + Precision_DOUBLE = 2, + Precision_MIN = Precision_HALF, + Precision_MAX = Precision_DOUBLE +}; + +inline const Precision (&EnumValuesPrecision())[3] +{ + static const Precision values[] = {Precision_HALF, Precision_SINGLE, Precision_DOUBLE}; + return values; +} + +inline const char* const* EnumNamesPrecision() +{ + static const char* const names[4] = {"HALF", "SINGLE", "DOUBLE", nullptr}; + return names; +} + +inline const char* EnumNamePrecision(Precision e) +{ + if (::flatbuffers::IsOutRange(e, Precision_HALF, Precision_DOUBLE)) return ""; + const size_t index = static_cast(e); + return EnumNamesPrecision()[index]; +} + +enum DateUnit : int16_t { + DateUnit_DAY = 0, + DateUnit_MILLISECOND = 1, + DateUnit_MIN = DateUnit_DAY, + DateUnit_MAX = DateUnit_MILLISECOND +}; + +inline const DateUnit (&EnumValuesDateUnit())[2] +{ + static const DateUnit values[] = {DateUnit_DAY, DateUnit_MILLISECOND}; + return values; +} + +inline const char* const* EnumNamesDateUnit() +{ + static const char* const names[3] = {"DAY", "MILLISECOND", nullptr}; + return names; +} + +inline const char* EnumNameDateUnit(DateUnit e) +{ + if (::flatbuffers::IsOutRange(e, DateUnit_DAY, DateUnit_MILLISECOND)) return ""; + const size_t index = static_cast(e); + return EnumNamesDateUnit()[index]; +} + +enum TimeUnit : int16_t { + TimeUnit_SECOND = 0, + 
TimeUnit_MILLISECOND = 1, + TimeUnit_MICROSECOND = 2, + TimeUnit_NANOSECOND = 3, + TimeUnit_MIN = TimeUnit_SECOND, + TimeUnit_MAX = TimeUnit_NANOSECOND +}; + +inline const TimeUnit (&EnumValuesTimeUnit())[4] +{ + static const TimeUnit values[] = { + TimeUnit_SECOND, TimeUnit_MILLISECOND, TimeUnit_MICROSECOND, TimeUnit_NANOSECOND}; + return values; +} + +inline const char* const* EnumNamesTimeUnit() +{ + static const char* const names[5] = { + "SECOND", "MILLISECOND", "MICROSECOND", "NANOSECOND", nullptr}; + return names; +} + +inline const char* EnumNameTimeUnit(TimeUnit e) +{ + if (::flatbuffers::IsOutRange(e, TimeUnit_SECOND, TimeUnit_NANOSECOND)) return ""; + const size_t index = static_cast(e); + return EnumNamesTimeUnit()[index]; +} + +enum IntervalUnit : int16_t { + IntervalUnit_YEAR_MONTH = 0, + IntervalUnit_DAY_TIME = 1, + IntervalUnit_MONTH_DAY_NANO = 2, + IntervalUnit_MIN = IntervalUnit_YEAR_MONTH, + IntervalUnit_MAX = IntervalUnit_MONTH_DAY_NANO +}; + +inline const IntervalUnit (&EnumValuesIntervalUnit())[3] +{ + static const IntervalUnit values[] = { + IntervalUnit_YEAR_MONTH, IntervalUnit_DAY_TIME, IntervalUnit_MONTH_DAY_NANO}; + return values; +} + +inline const char* const* EnumNamesIntervalUnit() +{ + static const char* const names[4] = {"YEAR_MONTH", "DAY_TIME", "MONTH_DAY_NANO", nullptr}; + return names; +} + +inline const char* EnumNameIntervalUnit(IntervalUnit e) +{ + if (::flatbuffers::IsOutRange(e, IntervalUnit_YEAR_MONTH, IntervalUnit_MONTH_DAY_NANO)) return ""; + const size_t index = static_cast(e); + return EnumNamesIntervalUnit()[index]; +} + +/// ---------------------------------------------------------------------- +/// Top-level Type value, enabling extensible type-specific metadata. We can +/// add new logical types to Type without breaking backwards compatibility +enum Type : uint8_t { + Type_NONE = 0, + Type_Null = 1, + Type_Int = 2, + Type_FloatingPoint = 3, + Type_Binary = 4, + Type_Utf8 = 5, + Type_Bool = 6, + Type_Decimal = 7, + Type_Date = 8, + Type_Time = 9, + Type_Timestamp = 10, + Type_Interval = 11, + Type_List = 12, + Type_Struct_ = 13, + Type_Union = 14, + Type_FixedSizeBinary = 15, + Type_FixedSizeList = 16, + Type_Map = 17, + Type_Duration = 18, + Type_LargeBinary = 19, + Type_LargeUtf8 = 20, + Type_LargeList = 21, + Type_RunEndEncoded = 22, + Type_BinaryView = 23, + Type_Utf8View = 24, + Type_ListView = 25, + Type_LargeListView = 26, + Type_MIN = Type_NONE, + Type_MAX = Type_LargeListView +}; + +inline const Type (&EnumValuesType())[27] +{ + static const Type values[] = { + Type_NONE, Type_Null, Type_Int, Type_FloatingPoint, + Type_Binary, Type_Utf8, Type_Bool, Type_Decimal, + Type_Date, Type_Time, Type_Timestamp, Type_Interval, + Type_List, Type_Struct_, Type_Union, Type_FixedSizeBinary, + Type_FixedSizeList, Type_Map, Type_Duration, Type_LargeBinary, + Type_LargeUtf8, Type_LargeList, Type_RunEndEncoded, Type_BinaryView, + Type_Utf8View, Type_ListView, Type_LargeListView}; + return values; +} + +inline const char* const* EnumNamesType() +{ + static const char* const names[28] = { + "NONE", "Null", "Int", "FloatingPoint", + "Binary", "Utf8", "Bool", "Decimal", + "Date", "Time", "Timestamp", "Interval", + "List", "Struct_", "Union", "FixedSizeBinary", + "FixedSizeList", "Map", "Duration", "LargeBinary", + "LargeUtf8", "LargeList", "RunEndEncoded", "BinaryView", + "Utf8View", "ListView", "LargeListView", nullptr}; + return names; +} + +inline const char* EnumNameType(Type e) +{ + if (::flatbuffers::IsOutRange(e, Type_NONE, Type_LargeListView)) 
return ""; + const size_t index = static_cast(e); + return EnumNamesType()[index]; +} + +template +struct TypeTraits { + static const Type enum_value = Type_NONE; +}; + +template <> +struct TypeTraits { + static const Type enum_value = Type_Null; +}; + +template <> +struct TypeTraits { + static const Type enum_value = Type_Int; +}; + +template <> +struct TypeTraits { + static const Type enum_value = Type_FloatingPoint; +}; + +template <> +struct TypeTraits { + static const Type enum_value = Type_Binary; +}; + +template <> +struct TypeTraits { + static const Type enum_value = Type_Utf8; +}; + +template <> +struct TypeTraits { + static const Type enum_value = Type_Bool; +}; + +template <> +struct TypeTraits { + static const Type enum_value = Type_Decimal; +}; + +template <> +struct TypeTraits { + static const Type enum_value = Type_Date; +}; + +template <> +struct TypeTraits { + static const Type enum_value = Type_Time; +}; + +template <> +struct TypeTraits { + static const Type enum_value = Type_Timestamp; +}; + +template <> +struct TypeTraits { + static const Type enum_value = Type_Interval; +}; + +template <> +struct TypeTraits { + static const Type enum_value = Type_List; +}; + +template <> +struct TypeTraits { + static const Type enum_value = Type_Struct_; +}; + +template <> +struct TypeTraits { + static const Type enum_value = Type_Union; +}; + +template <> +struct TypeTraits { + static const Type enum_value = Type_FixedSizeBinary; +}; + +template <> +struct TypeTraits { + static const Type enum_value = Type_FixedSizeList; +}; + +template <> +struct TypeTraits { + static const Type enum_value = Type_Map; +}; + +template <> +struct TypeTraits { + static const Type enum_value = Type_Duration; +}; + +template <> +struct TypeTraits { + static const Type enum_value = Type_LargeBinary; +}; + +template <> +struct TypeTraits { + static const Type enum_value = Type_LargeUtf8; +}; + +template <> +struct TypeTraits { + static const Type enum_value = Type_LargeList; +}; + +template <> +struct TypeTraits { + static const Type enum_value = Type_RunEndEncoded; +}; + +template <> +struct TypeTraits { + static const Type enum_value = Type_BinaryView; +}; + +template <> +struct TypeTraits { + static const Type enum_value = Type_Utf8View; +}; + +template <> +struct TypeTraits { + static const Type enum_value = Type_ListView; +}; + +template <> +struct TypeTraits { + static const Type enum_value = Type_LargeListView; +}; + +bool VerifyType(::flatbuffers::Verifier& verifier, const void* obj, Type type); +bool VerifyTypeVector(::flatbuffers::Verifier& verifier, + const ::flatbuffers::Vector<::flatbuffers::Offset>* values, + const ::flatbuffers::Vector* types); + +/// ---------------------------------------------------------------------- +/// Dictionary encoding metadata +/// Maintained for forwards compatibility, in the future +/// Dictionaries might be explicit maps between integers and values +/// allowing for non-contiguous index values +enum DictionaryKind : int16_t { + DictionaryKind_DenseArray = 0, + DictionaryKind_MIN = DictionaryKind_DenseArray, + DictionaryKind_MAX = DictionaryKind_DenseArray +}; + +inline const DictionaryKind (&EnumValuesDictionaryKind())[1] +{ + static const DictionaryKind values[] = {DictionaryKind_DenseArray}; + return values; +} + +inline const char* const* EnumNamesDictionaryKind() +{ + static const char* const names[2] = {"DenseArray", nullptr}; + return names; +} + +inline const char* EnumNameDictionaryKind(DictionaryKind e) +{ + if (::flatbuffers::IsOutRange(e, 
DictionaryKind_DenseArray, DictionaryKind_DenseArray)) return ""; + const size_t index = static_cast(e); + return EnumNamesDictionaryKind()[index]; +} + +/// ---------------------------------------------------------------------- +/// Endianness of the platform producing the data +enum Endianness : int16_t { + Endianness_Little = 0, + Endianness_Big = 1, + Endianness_MIN = Endianness_Little, + Endianness_MAX = Endianness_Big +}; + +inline const Endianness (&EnumValuesEndianness())[2] +{ + static const Endianness values[] = {Endianness_Little, Endianness_Big}; + return values; +} + +inline const char* const* EnumNamesEndianness() +{ + static const char* const names[3] = {"Little", "Big", nullptr}; + return names; +} + +inline const char* EnumNameEndianness(Endianness e) +{ + if (::flatbuffers::IsOutRange(e, Endianness_Little, Endianness_Big)) return ""; + const size_t index = static_cast(e); + return EnumNamesEndianness()[index]; +} + +/// ---------------------------------------------------------------------- +/// A Buffer represents a single contiguous memory segment +FLATBUFFERS_MANUALLY_ALIGNED_STRUCT(8) Buffer FLATBUFFERS_FINAL_CLASS +{ + private: + int64_t offset_; + int64_t length_; + + public: + Buffer() : offset_(0), length_(0) {} + Buffer(int64_t _offset, int64_t _length) + : offset_(::flatbuffers::EndianScalar(_offset)), length_(::flatbuffers::EndianScalar(_length)) + { + } + /// The relative offset into the shared memory page where the bytes for this + /// buffer starts + int64_t offset() const { return ::flatbuffers::EndianScalar(offset_); } + /// The absolute length (in bytes) of the memory buffer. The memory is found + /// from offset (inclusive) to offset + length (non-inclusive). When building + /// messages using the encapsulated IPC message, padding bytes may be written + /// after a buffer, but such padding bytes do not need to be accounted for in + /// the size here. + int64_t length() const { return ::flatbuffers::EndianScalar(length_); } +}; +FLATBUFFERS_STRUCT_END(Buffer, 16); + +/// These are stored in the flatbuffer in the Type union below +struct Null FLATBUFFERS_FINAL_CLASS : private ::flatbuffers::Table { + typedef NullBuilder Builder; + bool Verify(::flatbuffers::Verifier& verifier) const + { + return VerifyTableStart(verifier) && verifier.EndTable(); + } +}; + +struct NullBuilder { + typedef Null Table; + ::flatbuffers::FlatBufferBuilder& fbb_; + ::flatbuffers::uoffset_t start_; + explicit NullBuilder(::flatbuffers::FlatBufferBuilder& _fbb) : fbb_(_fbb) + { + start_ = fbb_.StartTable(); + } + ::flatbuffers::Offset Finish() + { + const auto end = fbb_.EndTable(start_); + auto o = ::flatbuffers::Offset(end); + return o; + } +}; + +inline ::flatbuffers::Offset CreateNull(::flatbuffers::FlatBufferBuilder& _fbb) +{ + NullBuilder builder_(_fbb); + return builder_.Finish(); +} + +/// A Struct_ in the flatbuffer metadata is the same as an Arrow Struct +/// (according to the physical memory layout). 
We used Struct_ here as +/// Struct is a reserved word in Flatbuffers +struct Struct_ FLATBUFFERS_FINAL_CLASS : private ::flatbuffers::Table { + typedef Struct_Builder Builder; + bool Verify(::flatbuffers::Verifier& verifier) const + { + return VerifyTableStart(verifier) && verifier.EndTable(); + } +}; + +struct Struct_Builder { + typedef Struct_ Table; + ::flatbuffers::FlatBufferBuilder& fbb_; + ::flatbuffers::uoffset_t start_; + explicit Struct_Builder(::flatbuffers::FlatBufferBuilder& _fbb) : fbb_(_fbb) + { + start_ = fbb_.StartTable(); + } + ::flatbuffers::Offset Finish() + { + const auto end = fbb_.EndTable(start_); + auto o = ::flatbuffers::Offset(end); + return o; + } +}; + +inline ::flatbuffers::Offset CreateStruct_(::flatbuffers::FlatBufferBuilder& _fbb) +{ + Struct_Builder builder_(_fbb); + return builder_.Finish(); +} + +struct List FLATBUFFERS_FINAL_CLASS : private ::flatbuffers::Table { + typedef ListBuilder Builder; + bool Verify(::flatbuffers::Verifier& verifier) const + { + return VerifyTableStart(verifier) && verifier.EndTable(); + } +}; + +struct ListBuilder { + typedef List Table; + ::flatbuffers::FlatBufferBuilder& fbb_; + ::flatbuffers::uoffset_t start_; + explicit ListBuilder(::flatbuffers::FlatBufferBuilder& _fbb) : fbb_(_fbb) + { + start_ = fbb_.StartTable(); + } + ::flatbuffers::Offset Finish() + { + const auto end = fbb_.EndTable(start_); + auto o = ::flatbuffers::Offset(end); + return o; + } +}; + +inline ::flatbuffers::Offset CreateList(::flatbuffers::FlatBufferBuilder& _fbb) +{ + ListBuilder builder_(_fbb); + return builder_.Finish(); +} + +/// Same as List, but with 64-bit offsets, allowing to represent +/// extremely large data values. +struct LargeList FLATBUFFERS_FINAL_CLASS : private ::flatbuffers::Table { + typedef LargeListBuilder Builder; + bool Verify(::flatbuffers::Verifier& verifier) const + { + return VerifyTableStart(verifier) && verifier.EndTable(); + } +}; + +struct LargeListBuilder { + typedef LargeList Table; + ::flatbuffers::FlatBufferBuilder& fbb_; + ::flatbuffers::uoffset_t start_; + explicit LargeListBuilder(::flatbuffers::FlatBufferBuilder& _fbb) : fbb_(_fbb) + { + start_ = fbb_.StartTable(); + } + ::flatbuffers::Offset Finish() + { + const auto end = fbb_.EndTable(start_); + auto o = ::flatbuffers::Offset(end); + return o; + } +}; + +inline ::flatbuffers::Offset CreateLargeList(::flatbuffers::FlatBufferBuilder& _fbb) +{ + LargeListBuilder builder_(_fbb); + return builder_.Finish(); +} + +/// Represents the same logical types that List can, but contains offsets and +/// sizes allowing for writes in any order and sharing of child values among +/// list values. +struct ListView FLATBUFFERS_FINAL_CLASS : private ::flatbuffers::Table { + typedef ListViewBuilder Builder; + bool Verify(::flatbuffers::Verifier& verifier) const + { + return VerifyTableStart(verifier) && verifier.EndTable(); + } +}; + +struct ListViewBuilder { + typedef ListView Table; + ::flatbuffers::FlatBufferBuilder& fbb_; + ::flatbuffers::uoffset_t start_; + explicit ListViewBuilder(::flatbuffers::FlatBufferBuilder& _fbb) : fbb_(_fbb) + { + start_ = fbb_.StartTable(); + } + ::flatbuffers::Offset Finish() + { + const auto end = fbb_.EndTable(start_); + auto o = ::flatbuffers::Offset(end); + return o; + } +}; + +inline ::flatbuffers::Offset CreateListView(::flatbuffers::FlatBufferBuilder& _fbb) +{ + ListViewBuilder builder_(_fbb); + return builder_.Finish(); +} + +/// Same as ListView, but with 64-bit offsets and sizes, allowing to represent +/// extremely large data values. 
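Each parameterless type table above (Null, Struct_, List, LargeList, ListView, and those that follow) exposes the same three-part pattern: a read-only table with Verify, a Builder wrapping StartTable/EndTable, and a CreateX convenience function. A minimal sketch of producing one such type table is below; the offset it returns is only meaningful inside the builder that created it.

::flatbuffers::FlatBufferBuilder fbb;

// CreateList starts a table, finishes it, and returns its offset within fbb.
::flatbuffers::Offset<cudf::io::parquet::flatbuf::List> list_type =
  cudf::io::parquet::flatbuf::CreateList(fbb);

// In a full schema, this offset would be referenced from a Field
// (forward-declared above) together with the Type_List tag.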
+struct LargeListView FLATBUFFERS_FINAL_CLASS : private ::flatbuffers::Table { + typedef LargeListViewBuilder Builder; + bool Verify(::flatbuffers::Verifier& verifier) const + { + return VerifyTableStart(verifier) && verifier.EndTable(); + } +}; + +struct LargeListViewBuilder { + typedef LargeListView Table; + ::flatbuffers::FlatBufferBuilder& fbb_; + ::flatbuffers::uoffset_t start_; + explicit LargeListViewBuilder(::flatbuffers::FlatBufferBuilder& _fbb) : fbb_(_fbb) + { + start_ = fbb_.StartTable(); + } + ::flatbuffers::Offset Finish() + { + const auto end = fbb_.EndTable(start_); + auto o = ::flatbuffers::Offset(end); + return o; + } +}; + +inline ::flatbuffers::Offset CreateLargeListView( + ::flatbuffers::FlatBufferBuilder& _fbb) +{ + LargeListViewBuilder builder_(_fbb); + return builder_.Finish(); +} + +struct FixedSizeList FLATBUFFERS_FINAL_CLASS : private ::flatbuffers::Table { + typedef FixedSizeListBuilder Builder; + enum FlatBuffersVTableOffset FLATBUFFERS_VTABLE_UNDERLYING_TYPE { VT_LISTSIZE = 4 }; + /// Number of list items per value + int32_t listSize() const { return GetField(VT_LISTSIZE, 0); } + bool Verify(::flatbuffers::Verifier& verifier) const + { + return VerifyTableStart(verifier) && VerifyField(verifier, VT_LISTSIZE, 4) && + verifier.EndTable(); + } +}; + +struct FixedSizeListBuilder { + typedef FixedSizeList Table; + ::flatbuffers::FlatBufferBuilder& fbb_; + ::flatbuffers::uoffset_t start_; + void add_listSize(int32_t listSize) + { + fbb_.AddElement(FixedSizeList::VT_LISTSIZE, listSize, 0); + } + explicit FixedSizeListBuilder(::flatbuffers::FlatBufferBuilder& _fbb) : fbb_(_fbb) + { + start_ = fbb_.StartTable(); + } + ::flatbuffers::Offset Finish() + { + const auto end = fbb_.EndTable(start_); + auto o = ::flatbuffers::Offset(end); + return o; + } +}; + +inline ::flatbuffers::Offset CreateFixedSizeList( + ::flatbuffers::FlatBufferBuilder& _fbb, int32_t listSize = 0) +{ + FixedSizeListBuilder builder_(_fbb); + builder_.add_listSize(listSize); + return builder_.Finish(); +} + +/// A Map is a logical nested type that is represented as +/// +/// List> +/// +/// In this layout, the keys and values are each respectively contiguous. We do +/// not constrain the key and value types, so the application is responsible +/// for ensuring that the keys are hashable and unique. Whether the keys are sorted +/// may be set in the metadata for this field. +/// +/// In a field with Map type, the field has a child Struct field, which then +/// has two children: key type and the second the value type. The names of the +/// child fields may be respectively "entries", "key", and "value", but this is +/// not enforced. +/// +/// Map +/// ```text +/// - child[0] entries: Struct +/// - child[0] key: K +/// - child[1] value: V +/// ``` +/// Neither the "entries" field nor the "key" field may be nullable. +/// +/// The metadata is structured so that Arrow systems without special handling +/// for Map can make Map an alias for List. The "layout" attribute for the Map +/// field must have the same contents as a List. 
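The Map comment above describes structure that lives in a Field's children rather than in the Map table itself; the table only records whether keys are sorted. A short sketch follows, with the conventional (not enforced) child layout repeated as a comment for orientation.

::flatbuffers::FlatBufferBuilder fbb;
auto map_type = cudf::io::parquet::flatbuf::CreateMap(fbb, /*keysSorted=*/false);

// A Map-typed field then nests its children as:
//   some_map: Map
//     entries: Struct_        (child[0], non-nullable)
//       key:   K              (non-nullable)
//       value: V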
+struct Map FLATBUFFERS_FINAL_CLASS : private ::flatbuffers::Table { + typedef MapBuilder Builder; + enum FlatBuffersVTableOffset FLATBUFFERS_VTABLE_UNDERLYING_TYPE { VT_KEYSSORTED = 4 }; + /// Set to true if the keys within each value are sorted + bool keysSorted() const { return GetField(VT_KEYSSORTED, 0) != 0; } + bool Verify(::flatbuffers::Verifier& verifier) const + { + return VerifyTableStart(verifier) && VerifyField(verifier, VT_KEYSSORTED, 1) && + verifier.EndTable(); + } +}; + +struct MapBuilder { + typedef Map Table; + ::flatbuffers::FlatBufferBuilder& fbb_; + ::flatbuffers::uoffset_t start_; + void add_keysSorted(bool keysSorted) + { + fbb_.AddElement(Map::VT_KEYSSORTED, static_cast(keysSorted), 0); + } + explicit MapBuilder(::flatbuffers::FlatBufferBuilder& _fbb) : fbb_(_fbb) + { + start_ = fbb_.StartTable(); + } + ::flatbuffers::Offset Finish() + { + const auto end = fbb_.EndTable(start_); + auto o = ::flatbuffers::Offset(end); + return o; + } +}; + +inline ::flatbuffers::Offset CreateMap(::flatbuffers::FlatBufferBuilder& _fbb, + bool keysSorted = false) +{ + MapBuilder builder_(_fbb); + builder_.add_keysSorted(keysSorted); + return builder_.Finish(); +} + +/// A union is a complex type with children in Field +/// By default ids in the type vector refer to the offsets in the children +/// optionally typeIds provides an indirection between the child offset and the type id +/// for each child `typeIds[offset]` is the id used in the type vector +struct Union FLATBUFFERS_FINAL_CLASS : private ::flatbuffers::Table { + typedef UnionBuilder Builder; + enum FlatBuffersVTableOffset FLATBUFFERS_VTABLE_UNDERLYING_TYPE { VT_MODE = 4, VT_TYPEIDS = 6 }; + cudf::io::parquet::flatbuf::UnionMode mode() const + { + return static_cast(GetField(VT_MODE, 0)); + } + const ::flatbuffers::Vector* typeIds() const + { + return GetPointer*>(VT_TYPEIDS); + } + bool Verify(::flatbuffers::Verifier& verifier) const + { + return VerifyTableStart(verifier) && VerifyField(verifier, VT_MODE, 2) && + VerifyOffset(verifier, VT_TYPEIDS) && verifier.VerifyVector(typeIds()) && + verifier.EndTable(); + } +}; + +struct UnionBuilder { + typedef Union Table; + ::flatbuffers::FlatBufferBuilder& fbb_; + ::flatbuffers::uoffset_t start_; + void add_mode(cudf::io::parquet::flatbuf::UnionMode mode) + { + fbb_.AddElement(Union::VT_MODE, static_cast(mode), 0); + } + void add_typeIds(::flatbuffers::Offset<::flatbuffers::Vector> typeIds) + { + fbb_.AddOffset(Union::VT_TYPEIDS, typeIds); + } + explicit UnionBuilder(::flatbuffers::FlatBufferBuilder& _fbb) : fbb_(_fbb) + { + start_ = fbb_.StartTable(); + } + ::flatbuffers::Offset Finish() + { + const auto end = fbb_.EndTable(start_); + auto o = ::flatbuffers::Offset(end); + return o; + } +}; + +inline ::flatbuffers::Offset CreateUnion( + ::flatbuffers::FlatBufferBuilder& _fbb, + cudf::io::parquet::flatbuf::UnionMode mode = cudf::io::parquet::flatbuf::UnionMode_Sparse, + ::flatbuffers::Offset<::flatbuffers::Vector> typeIds = 0) +{ + UnionBuilder builder_(_fbb); + builder_.add_typeIds(typeIds); + builder_.add_mode(mode); + return builder_.Finish(); +} + +inline ::flatbuffers::Offset CreateUnionDirect( + ::flatbuffers::FlatBufferBuilder& _fbb, + cudf::io::parquet::flatbuf::UnionMode mode = cudf::io::parquet::flatbuf::UnionMode_Sparse, + const std::vector* typeIds = nullptr) +{ + auto typeIds__ = typeIds ? 
_fbb.CreateVector(*typeIds) : 0; + return cudf::io::parquet::flatbuf::CreateUnion(_fbb, mode, typeIds__); +} + +struct Int FLATBUFFERS_FINAL_CLASS : private ::flatbuffers::Table { + typedef IntBuilder Builder; + enum FlatBuffersVTableOffset FLATBUFFERS_VTABLE_UNDERLYING_TYPE { + VT_BITWIDTH = 4, + VT_IS_SIGNED = 6 + }; + int32_t bitWidth() const { return GetField(VT_BITWIDTH, 0); } + bool is_signed() const { return GetField(VT_IS_SIGNED, 0) != 0; } + bool Verify(::flatbuffers::Verifier& verifier) const + { + return VerifyTableStart(verifier) && VerifyField(verifier, VT_BITWIDTH, 4) && + VerifyField(verifier, VT_IS_SIGNED, 1) && verifier.EndTable(); + } +}; + +struct IntBuilder { + typedef Int Table; + ::flatbuffers::FlatBufferBuilder& fbb_; + ::flatbuffers::uoffset_t start_; + void add_bitWidth(int32_t bitWidth) { fbb_.AddElement(Int::VT_BITWIDTH, bitWidth, 0); } + void add_is_signed(bool is_signed) + { + fbb_.AddElement(Int::VT_IS_SIGNED, static_cast(is_signed), 0); + } + explicit IntBuilder(::flatbuffers::FlatBufferBuilder& _fbb) : fbb_(_fbb) + { + start_ = fbb_.StartTable(); + } + ::flatbuffers::Offset Finish() + { + const auto end = fbb_.EndTable(start_); + auto o = ::flatbuffers::Offset(end); + return o; + } +}; + +inline ::flatbuffers::Offset CreateInt(::flatbuffers::FlatBufferBuilder& _fbb, + int32_t bitWidth = 0, + bool is_signed = false) +{ + IntBuilder builder_(_fbb); + builder_.add_bitWidth(bitWidth); + builder_.add_is_signed(is_signed); + return builder_.Finish(); +} + +struct FloatingPoint FLATBUFFERS_FINAL_CLASS : private ::flatbuffers::Table { + typedef FloatingPointBuilder Builder; + enum FlatBuffersVTableOffset FLATBUFFERS_VTABLE_UNDERLYING_TYPE { VT_PRECISION = 4 }; + cudf::io::parquet::flatbuf::Precision precision() const + { + return static_cast(GetField(VT_PRECISION, 0)); + } + bool Verify(::flatbuffers::Verifier& verifier) const + { + return VerifyTableStart(verifier) && VerifyField(verifier, VT_PRECISION, 2) && + verifier.EndTable(); + } +}; + +struct FloatingPointBuilder { + typedef FloatingPoint Table; + ::flatbuffers::FlatBufferBuilder& fbb_; + ::flatbuffers::uoffset_t start_; + void add_precision(cudf::io::parquet::flatbuf::Precision precision) + { + fbb_.AddElement(FloatingPoint::VT_PRECISION, static_cast(precision), 0); + } + explicit FloatingPointBuilder(::flatbuffers::FlatBufferBuilder& _fbb) : fbb_(_fbb) + { + start_ = fbb_.StartTable(); + } + ::flatbuffers::Offset Finish() + { + const auto end = fbb_.EndTable(start_); + auto o = ::flatbuffers::Offset(end); + return o; + } +}; + +inline ::flatbuffers::Offset CreateFloatingPoint( + ::flatbuffers::FlatBufferBuilder& _fbb, + cudf::io::parquet::flatbuf::Precision precision = cudf::io::parquet::flatbuf::Precision_HALF) +{ + FloatingPointBuilder builder_(_fbb); + builder_.add_precision(precision); + return builder_.Finish(); +} + +/// Unicode with UTF-8 encoding +struct Utf8 FLATBUFFERS_FINAL_CLASS : private ::flatbuffers::Table { + typedef Utf8Builder Builder; + bool Verify(::flatbuffers::Verifier& verifier) const + { + return VerifyTableStart(verifier) && verifier.EndTable(); + } +}; + +struct Utf8Builder { + typedef Utf8 Table; + ::flatbuffers::FlatBufferBuilder& fbb_; + ::flatbuffers::uoffset_t start_; + explicit Utf8Builder(::flatbuffers::FlatBufferBuilder& _fbb) : fbb_(_fbb) + { + start_ = fbb_.StartTable(); + } + ::flatbuffers::Offset Finish() + { + const auto end = fbb_.EndTable(start_); + auto o = ::flatbuffers::Offset(end); + return o; + } +}; + +inline ::flatbuffers::Offset 
CreateUtf8(::flatbuffers::FlatBufferBuilder& _fbb) +{ + Utf8Builder builder_(_fbb); + return builder_.Finish(); +} + +/// Opaque binary data +struct Binary FLATBUFFERS_FINAL_CLASS : private ::flatbuffers::Table { + typedef BinaryBuilder Builder; + bool Verify(::flatbuffers::Verifier& verifier) const + { + return VerifyTableStart(verifier) && verifier.EndTable(); + } +}; + +struct BinaryBuilder { + typedef Binary Table; + ::flatbuffers::FlatBufferBuilder& fbb_; + ::flatbuffers::uoffset_t start_; + explicit BinaryBuilder(::flatbuffers::FlatBufferBuilder& _fbb) : fbb_(_fbb) + { + start_ = fbb_.StartTable(); + } + ::flatbuffers::Offset Finish() + { + const auto end = fbb_.EndTable(start_); + auto o = ::flatbuffers::Offset(end); + return o; + } +}; + +inline ::flatbuffers::Offset CreateBinary(::flatbuffers::FlatBufferBuilder& _fbb) +{ + BinaryBuilder builder_(_fbb); + return builder_.Finish(); +} + +/// Same as Utf8, but with 64-bit offsets, allowing to represent +/// extremely large data values. +struct LargeUtf8 FLATBUFFERS_FINAL_CLASS : private ::flatbuffers::Table { + typedef LargeUtf8Builder Builder; + bool Verify(::flatbuffers::Verifier& verifier) const + { + return VerifyTableStart(verifier) && verifier.EndTable(); + } +}; + +struct LargeUtf8Builder { + typedef LargeUtf8 Table; + ::flatbuffers::FlatBufferBuilder& fbb_; + ::flatbuffers::uoffset_t start_; + explicit LargeUtf8Builder(::flatbuffers::FlatBufferBuilder& _fbb) : fbb_(_fbb) + { + start_ = fbb_.StartTable(); + } + ::flatbuffers::Offset Finish() + { + const auto end = fbb_.EndTable(start_); + auto o = ::flatbuffers::Offset(end); + return o; + } +}; + +inline ::flatbuffers::Offset CreateLargeUtf8(::flatbuffers::FlatBufferBuilder& _fbb) +{ + LargeUtf8Builder builder_(_fbb); + return builder_.Finish(); +} + +/// Same as Binary, but with 64-bit offsets, allowing to represent +/// extremely large data values. +struct LargeBinary FLATBUFFERS_FINAL_CLASS : private ::flatbuffers::Table { + typedef LargeBinaryBuilder Builder; + bool Verify(::flatbuffers::Verifier& verifier) const + { + return VerifyTableStart(verifier) && verifier.EndTable(); + } +}; + +struct LargeBinaryBuilder { + typedef LargeBinary Table; + ::flatbuffers::FlatBufferBuilder& fbb_; + ::flatbuffers::uoffset_t start_; + explicit LargeBinaryBuilder(::flatbuffers::FlatBufferBuilder& _fbb) : fbb_(_fbb) + { + start_ = fbb_.StartTable(); + } + ::flatbuffers::Offset Finish() + { + const auto end = fbb_.EndTable(start_); + auto o = ::flatbuffers::Offset(end); + return o; + } +}; + +inline ::flatbuffers::Offset CreateLargeBinary(::flatbuffers::FlatBufferBuilder& _fbb) +{ + LargeBinaryBuilder builder_(_fbb); + return builder_.Finish(); +} + +/// Logically the same as Utf8, but the internal representation uses a view +/// struct that contains the string length and either the string's entire data +/// inline (for small strings) or an inlined prefix, an index of another buffer, +/// and an offset pointing to a slice in that buffer (for non-small strings). +/// +/// Since it uses a variable number of data buffers, each Field with this type +/// must have a corresponding entry in `variadicBufferCounts`. 
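The "view struct" mentioned above has a fixed 16-byte layout in the Arrow columnar format; the sketch below is for orientation only and is not part of this header. Strings of at most 12 bytes are stored entirely inline, while longer ones keep a 4-byte prefix plus an index into one of the variadic data buffers and an offset within it.

#include <cstdint>

struct string_view_layout_sketch {
  int32_t length;            // number of bytes in the string
  union payload_t {
    char inlined[12];        // used when length <= 12
    struct ref_t {
      char prefix[4];        // first four bytes, for fast comparisons
      int32_t buffer_index;  // which variadic data buffer holds the string
      int32_t offset;        // byte offset of the string within that buffer
    } ref;
  } payload;
};
static_assert(sizeof(string_view_layout_sketch) == 16, "views are 16 bytes");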
+struct Utf8View FLATBUFFERS_FINAL_CLASS : private ::flatbuffers::Table { + typedef Utf8ViewBuilder Builder; + bool Verify(::flatbuffers::Verifier& verifier) const + { + return VerifyTableStart(verifier) && verifier.EndTable(); + } +}; + +struct Utf8ViewBuilder { + typedef Utf8View Table; + ::flatbuffers::FlatBufferBuilder& fbb_; + ::flatbuffers::uoffset_t start_; + explicit Utf8ViewBuilder(::flatbuffers::FlatBufferBuilder& _fbb) : fbb_(_fbb) + { + start_ = fbb_.StartTable(); + } + ::flatbuffers::Offset Finish() + { + const auto end = fbb_.EndTable(start_); + auto o = ::flatbuffers::Offset(end); + return o; + } +}; + +inline ::flatbuffers::Offset CreateUtf8View(::flatbuffers::FlatBufferBuilder& _fbb) +{ + Utf8ViewBuilder builder_(_fbb); + return builder_.Finish(); +} + +/// Logically the same as Binary, but the internal representation uses a view +/// struct that contains the string length and either the string's entire data +/// inline (for small strings) or an inlined prefix, an index of another buffer, +/// and an offset pointing to a slice in that buffer (for non-small strings). +/// +/// Since it uses a variable number of data buffers, each Field with this type +/// must have a corresponding entry in `variadicBufferCounts`. +struct BinaryView FLATBUFFERS_FINAL_CLASS : private ::flatbuffers::Table { + typedef BinaryViewBuilder Builder; + bool Verify(::flatbuffers::Verifier& verifier) const + { + return VerifyTableStart(verifier) && verifier.EndTable(); + } +}; + +struct BinaryViewBuilder { + typedef BinaryView Table; + ::flatbuffers::FlatBufferBuilder& fbb_; + ::flatbuffers::uoffset_t start_; + explicit BinaryViewBuilder(::flatbuffers::FlatBufferBuilder& _fbb) : fbb_(_fbb) + { + start_ = fbb_.StartTable(); + } + ::flatbuffers::Offset Finish() + { + const auto end = fbb_.EndTable(start_); + auto o = ::flatbuffers::Offset(end); + return o; + } +}; + +inline ::flatbuffers::Offset CreateBinaryView(::flatbuffers::FlatBufferBuilder& _fbb) +{ + BinaryViewBuilder builder_(_fbb); + return builder_.Finish(); +} + +struct FixedSizeBinary FLATBUFFERS_FINAL_CLASS : private ::flatbuffers::Table { + typedef FixedSizeBinaryBuilder Builder; + enum FlatBuffersVTableOffset FLATBUFFERS_VTABLE_UNDERLYING_TYPE { VT_BYTEWIDTH = 4 }; + /// Number of bytes per value + int32_t byteWidth() const { return GetField(VT_BYTEWIDTH, 0); } + bool Verify(::flatbuffers::Verifier& verifier) const + { + return VerifyTableStart(verifier) && VerifyField(verifier, VT_BYTEWIDTH, 4) && + verifier.EndTable(); + } +}; + +struct FixedSizeBinaryBuilder { + typedef FixedSizeBinary Table; + ::flatbuffers::FlatBufferBuilder& fbb_; + ::flatbuffers::uoffset_t start_; + void add_byteWidth(int32_t byteWidth) + { + fbb_.AddElement(FixedSizeBinary::VT_BYTEWIDTH, byteWidth, 0); + } + explicit FixedSizeBinaryBuilder(::flatbuffers::FlatBufferBuilder& _fbb) : fbb_(_fbb) + { + start_ = fbb_.StartTable(); + } + ::flatbuffers::Offset Finish() + { + const auto end = fbb_.EndTable(start_); + auto o = ::flatbuffers::Offset(end); + return o; + } +}; + +inline ::flatbuffers::Offset CreateFixedSizeBinary( + ::flatbuffers::FlatBufferBuilder& _fbb, int32_t byteWidth = 0) +{ + FixedSizeBinaryBuilder builder_(_fbb); + builder_.add_byteWidth(byteWidth); + return builder_.Finish(); +} + +struct Bool FLATBUFFERS_FINAL_CLASS : private ::flatbuffers::Table { + typedef BoolBuilder Builder; + bool Verify(::flatbuffers::Verifier& verifier) const + { + return VerifyTableStart(verifier) && verifier.EndTable(); + } +}; + +struct BoolBuilder { + typedef Bool Table; + 
::flatbuffers::FlatBufferBuilder& fbb_; + ::flatbuffers::uoffset_t start_; + explicit BoolBuilder(::flatbuffers::FlatBufferBuilder& _fbb) : fbb_(_fbb) + { + start_ = fbb_.StartTable(); + } + ::flatbuffers::Offset Finish() + { + const auto end = fbb_.EndTable(start_); + auto o = ::flatbuffers::Offset(end); + return o; + } +}; + +inline ::flatbuffers::Offset CreateBool(::flatbuffers::FlatBufferBuilder& _fbb) +{ + BoolBuilder builder_(_fbb); + return builder_.Finish(); +} + +/// Contains two child arrays, run_ends and values. +/// The run_ends child array must be a 16/32/64-bit integer array +/// which encodes the indices at which the run with the value in +/// each corresponding index in the values child array ends. +/// Like list/struct types, the value array can be of any type. +struct RunEndEncoded FLATBUFFERS_FINAL_CLASS : private ::flatbuffers::Table { + typedef RunEndEncodedBuilder Builder; + bool Verify(::flatbuffers::Verifier& verifier) const + { + return VerifyTableStart(verifier) && verifier.EndTable(); + } +}; + +struct RunEndEncodedBuilder { + typedef RunEndEncoded Table; + ::flatbuffers::FlatBufferBuilder& fbb_; + ::flatbuffers::uoffset_t start_; + explicit RunEndEncodedBuilder(::flatbuffers::FlatBufferBuilder& _fbb) : fbb_(_fbb) + { + start_ = fbb_.StartTable(); + } + ::flatbuffers::Offset Finish() + { + const auto end = fbb_.EndTable(start_); + auto o = ::flatbuffers::Offset(end); + return o; + } +}; + +inline ::flatbuffers::Offset CreateRunEndEncoded( + ::flatbuffers::FlatBufferBuilder& _fbb) +{ + RunEndEncodedBuilder builder_(_fbb); + return builder_.Finish(); +} + +/// Exact decimal value represented as an integer value in two's +/// complement. Currently only 128-bit (16-byte) and 256-bit (32-byte) integers +/// are used. The representation uses the endianness indicated +/// in the Schema. +struct Decimal FLATBUFFERS_FINAL_CLASS : private ::flatbuffers::Table { + typedef DecimalBuilder Builder; + enum FlatBuffersVTableOffset FLATBUFFERS_VTABLE_UNDERLYING_TYPE { + VT_PRECISION = 4, + VT_SCALE = 6, + VT_BITWIDTH = 8 + }; + /// Total number of decimal digits + int32_t precision() const { return GetField(VT_PRECISION, 0); } + /// Number of digits after the decimal point "." + int32_t scale() const { return GetField(VT_SCALE, 0); } + /// Number of bits per value. The only accepted widths are 128 and 256. + /// We use bitWidth for consistency with Int::bitWidth. 
+ int32_t bitWidth() const { return GetField(VT_BITWIDTH, 128); } + bool Verify(::flatbuffers::Verifier& verifier) const + { + return VerifyTableStart(verifier) && VerifyField(verifier, VT_PRECISION, 4) && + VerifyField(verifier, VT_SCALE, 4) && + VerifyField(verifier, VT_BITWIDTH, 4) && verifier.EndTable(); + } +}; + +struct DecimalBuilder { + typedef Decimal Table; + ::flatbuffers::FlatBufferBuilder& fbb_; + ::flatbuffers::uoffset_t start_; + void add_precision(int32_t precision) + { + fbb_.AddElement(Decimal::VT_PRECISION, precision, 0); + } + void add_scale(int32_t scale) { fbb_.AddElement(Decimal::VT_SCALE, scale, 0); } + void add_bitWidth(int32_t bitWidth) + { + fbb_.AddElement(Decimal::VT_BITWIDTH, bitWidth, 128); + } + explicit DecimalBuilder(::flatbuffers::FlatBufferBuilder& _fbb) : fbb_(_fbb) + { + start_ = fbb_.StartTable(); + } + ::flatbuffers::Offset Finish() + { + const auto end = fbb_.EndTable(start_); + auto o = ::flatbuffers::Offset(end); + return o; + } +}; + +inline ::flatbuffers::Offset CreateDecimal(::flatbuffers::FlatBufferBuilder& _fbb, + int32_t precision = 0, + int32_t scale = 0, + int32_t bitWidth = 128) +{ + DecimalBuilder builder_(_fbb); + builder_.add_bitWidth(bitWidth); + builder_.add_scale(scale); + builder_.add_precision(precision); + return builder_.Finish(); +} + +/// Date is either a 32-bit or 64-bit signed integer type representing an +/// elapsed time since UNIX epoch (1970-01-01), stored in either of two units: +/// +/// * Milliseconds (64 bits) indicating UNIX time elapsed since the epoch (no +/// leap seconds), where the values are evenly divisible by 86400000 +/// * Days (32 bits) since the UNIX epoch +struct Date FLATBUFFERS_FINAL_CLASS : private ::flatbuffers::Table { + typedef DateBuilder Builder; + enum FlatBuffersVTableOffset FLATBUFFERS_VTABLE_UNDERLYING_TYPE { VT_UNIT = 4 }; + cudf::io::parquet::flatbuf::DateUnit unit() const + { + return static_cast(GetField(VT_UNIT, 1)); + } + bool Verify(::flatbuffers::Verifier& verifier) const + { + return VerifyTableStart(verifier) && VerifyField(verifier, VT_UNIT, 2) && + verifier.EndTable(); + } +}; + +struct DateBuilder { + typedef Date Table; + ::flatbuffers::FlatBufferBuilder& fbb_; + ::flatbuffers::uoffset_t start_; + void add_unit(cudf::io::parquet::flatbuf::DateUnit unit) + { + fbb_.AddElement(Date::VT_UNIT, static_cast(unit), 1); + } + explicit DateBuilder(::flatbuffers::FlatBufferBuilder& _fbb) : fbb_(_fbb) + { + start_ = fbb_.StartTable(); + } + ::flatbuffers::Offset Finish() + { + const auto end = fbb_.EndTable(start_); + auto o = ::flatbuffers::Offset(end); + return o; + } +}; + +inline ::flatbuffers::Offset CreateDate( + ::flatbuffers::FlatBufferBuilder& _fbb, + cudf::io::parquet::flatbuf::DateUnit unit = cudf::io::parquet::flatbuf::DateUnit_MILLISECOND) +{ + DateBuilder builder_(_fbb); + builder_.add_unit(unit); + return builder_.Finish(); +} + +/// Time is either a 32-bit or 64-bit signed integer type representing an +/// elapsed time since midnight, stored in either of four units: seconds, +/// milliseconds, microseconds or nanoseconds. +/// +/// The integer `bitWidth` depends on the `unit` and must be one of the following: +/// * SECOND and MILLISECOND: 32 bits +/// * MICROSECOND and NANOSECOND: 64 bits +/// +/// The allowed values are between 0 (inclusive) and 86400 (=24*60*60) seconds +/// (exclusive), adjusted for the time unit (for example, up to 86400000 +/// exclusive for the MILLISECOND unit). +/// This definition doesn't allow for leap seconds. 
Time values from +/// measurements with leap seconds will need to be corrected when ingesting +/// into Arrow (for example by replacing the value 86400 with 86399). +struct Time FLATBUFFERS_FINAL_CLASS : private ::flatbuffers::Table { + typedef TimeBuilder Builder; + enum FlatBuffersVTableOffset FLATBUFFERS_VTABLE_UNDERLYING_TYPE { VT_UNIT = 4, VT_BITWIDTH = 6 }; + cudf::io::parquet::flatbuf::TimeUnit unit() const + { + return static_cast(GetField(VT_UNIT, 1)); + } + int32_t bitWidth() const { return GetField(VT_BITWIDTH, 32); } + bool Verify(::flatbuffers::Verifier& verifier) const + { + return VerifyTableStart(verifier) && VerifyField(verifier, VT_UNIT, 2) && + VerifyField(verifier, VT_BITWIDTH, 4) && verifier.EndTable(); + } +}; + +struct TimeBuilder { + typedef Time Table; + ::flatbuffers::FlatBufferBuilder& fbb_; + ::flatbuffers::uoffset_t start_; + void add_unit(cudf::io::parquet::flatbuf::TimeUnit unit) + { + fbb_.AddElement(Time::VT_UNIT, static_cast(unit), 1); + } + void add_bitWidth(int32_t bitWidth) { fbb_.AddElement(Time::VT_BITWIDTH, bitWidth, 32); } + explicit TimeBuilder(::flatbuffers::FlatBufferBuilder& _fbb) : fbb_(_fbb) + { + start_ = fbb_.StartTable(); + } + ::flatbuffers::Offset