6 #include <unordered_map>
9 #include <sparrow/record_batch.hpp>
21 sparrow::record_batch data;
69 [[nodiscard]] bool is_emitted(int64_t id) const noexcept;
79 std::set<int64_t> m_emitted_dict_ids;
80 std::unordered_map<int64_t, std::string> m_dictionary_id_origins;
81 std::unordered_map<int64_t, std::size_t> m_emitted_dict_sizes;
82 std::unordered_map<int64_t, std::size_t> m_pending_dict_sizes;
Tracks dictionaries during serialization.
void mark_emitted(int64_t id) noexcept
Mark a dictionary as emitted.
std::vector< dictionary_info > extract_dictionaries_from_batch(const sparrow::record_batch &batch)
Extract dictionaries from a record batch.
bool is_emitted(int64_t id) const noexcept
Check if a dictionary has been emitted.
void reset() noexcept
Reset tracking state.
Information about a dictionary used for encoding.
bool is_delta
Whether this is a delta update.
sparrow::record_batch data
Dictionary values as a single-column record batch.
int64_t id
Dictionary identifier.
bool is_ordered
Whether dictionary values are ordered.