8#include <unordered_set>
11#include <sparrow/arrow_interface/arrow_array_schema_proxy.hpp>
35 template <template <typename...> class ArrayType, typename T>
39 std::optional<std::string> format_override = std::nullopt
42 const std::string_view format = format_override.has_value()
44 : sparrow::data_type_to_format(sparrow::detail::get_data_type_from_array<ArrayType<T>>::get());
56 const auto compression = context.record_batch.compression();
57 std::vector<arrow_array_private_data::optionally_owned_buffer> buffers;
58 constexpr auto nb_buffers = 2;
59 buffers.reserve(nb_buffers);
71 buffers.push_back(std::move(validity_buffer_span));
72 buffers.push_back(std::move(data_buffer_span));
76 const auto null_count = std::visit(
77 [length = field_desc.length](const auto& arg) {
78 std::span<const uint8_t> span(arg.data(), arg.size());
79 return utils::get_bitmap_pointer_and_null_count(span, length).second;
94 sparrow::arrow_proxy ap{std::move(array), std::move(schema)};
95 return ArrayType<T>{std::move(ap)};
ArrayType< T > deserialize_simple_array(deserialization_context &context, const field_descriptor &field_desc, std::optional< std::string > format_override=std::nullopt)
Generic implementation for deserializing non-owning arrays with simple layout.
std::span< const uint8_t > get_buffer(const org::apache::arrow::flatbuf::RecordBatch &record_batch, std::span< const uint8_t > body, size_t &buffer_index)
Extracts a buffer from a RecordBatch's body.
std::variant< sparrow::buffer< std::uint8_t >, std::span< const std::uint8_t > > get_decompressed_buffer(std::span< const uint8_t > buffer_span, const org::apache::arrow::flatbuf::BodyCompression *compression)
Retrieves a decompressed buffer or a view of the original buffer.
ArrowSchema make_non_owning_arrow_schema(std::string_view format, std::string_view name, std::optional< M > metadata, std::optional< std::unordered_set< sparrow::ArrowFlag > > flags, size_t children_count, ArrowSchema **children, ArrowSchema *dictionary)
ArrowArray make_arrow_array(int64_t length, int64_t null_count, int64_t offset, size_t children_count, ArrowArray **children, ArrowArray *dictionary, Arg &&private_data_arg)
Encapsulates the context required for deserialization.
std::span< const uint8_t > body
const org::apache::arrow::flatbuf::RecordBatch & record_batch
Encapsulates the description of a field to be deserialized.
std::optional< std::vector< sparrow::metadata_pair > > metadata
std::optional< std::unordered_set< sparrow::ArrowFlag > > flags