OmniSciDB
a5dc49c757
|
#include <ParquetInPlaceEncoder.h>
Public Member Functions | |
TypedParquetInPlaceEncoder (Data_Namespace::AbstractBuffer *buffer, const ColumnDescriptor *column_desciptor, const parquet::ColumnDescriptor *parquet_column_descriptor) | |
TypedParquetInPlaceEncoder (Data_Namespace::AbstractBuffer *buffer, const size_t omnisci_data_type_byte_size, const size_t parquet_data_type_byte_size) | |
void | validate (const int8_t *parquet_data, const int64_t j, const SQLTypeInfo &column_type) const override |
std::string | integralTypeToString (const V &element) const |
bool | isIntegralType (const SQLTypeInfo &type) const |
std::string | elementToString (const V &element) const |
std::string | encodedDataToString (const int8_t *bytes) const override |
void | setDetectBufferConverterType () |
void | validateUsingEncodersColumnType (const int8_t *parquet_data, const int64_t j) const override |
void | reserve (const size_t num_append_elements) override |
void | appendDataTrackErrors (const int16_t *def_levels, const int16_t *rep_levels, const int64_t values_read, const int64_t levels_read, int8_t *values) override |
void | validateAndAppendData (const int16_t *def_levels, const int16_t *rep_levels, const int64_t values_read, const int64_t levels_read, int8_t *values, const SQLTypeInfo &column_type, InvalidRowGroupIndices &invalid_indices) override |
void | eraseInvalidIndicesInBuffer (const InvalidRowGroupIndices &invalid_indices) override |
void | appendData (const int16_t *def_levels, const int16_t *rep_levels, const int64_t values_read, const int64_t levels_read, int8_t *values) override |
void | encodeAndCopyContiguous (const int8_t *parquet_data_bytes, int8_t *omnisci_data_bytes, const size_t num_elements) override |
void | setNull (int8_t *omnisci_data_bytes) override |
void | copy (const int8_t *omnisci_data_bytes_source, int8_t *omnisci_data_bytes_destination) override |
std::shared_ptr< ChunkMetadata > | getRowGroupMetadata (const parquet::RowGroupMetaData *group_metadata, const int parquet_column_index, const SQLTypeInfo &column_type) override |
Public Member Functions inherited from foreign_storage::ParquetInPlaceEncoder | |
ParquetInPlaceEncoder (Data_Namespace::AbstractBuffer *buffer, const size_t omnisci_data_type_byte_size, const size_t parquet_data_type_byte_size) | |
Public Member Functions inherited from foreign_storage::ParquetScalarEncoder | |
ParquetScalarEncoder (Data_Namespace::AbstractBuffer *buffer) | |
virtual void | encodeAndCopy (const int8_t *parquet_data_bytes, int8_t *omnisci_data_bytes)=0 |
Public Member Functions inherited from foreign_storage::ParquetEncoder | |
ParquetEncoder (Data_Namespace::AbstractBuffer *buffer) | |
virtual | ~ParquetEncoder ()=default |
RejectedRowIndices | getRejectedRowIndices () const |
virtual void | disableMetadataStatsValidation () |
virtual void | initializeErrorTracking () |
virtual void | initializeColumnType (const SQLTypeInfo &column_type) |
Protected Member Functions | |
virtual bool | encodingIsIdentityForSameTypes () const |
std::pair< T, T > | getUnencodedStats (std::shared_ptr< parquet::Statistics > stats) const |
Private Member Functions | |
std::pair< V, V > | getEncodedStats (const parquet::ColumnDescriptor *parquet_column_descriptor, std::shared_ptr< parquet::Statistics > stats) |
Static Private Member Functions | |
static ChunkStats | getUpdatedStats (V &stats_min, V &stats_max, const SQLTypeInfo &column_type) |
Private Attributes | |
int64_t | current_batch_offset_ = 0 |
Additional Inherited Members | |
Static Protected Member Functions inherited from foreign_storage::ParquetEncoder | |
static std::shared_ptr< ChunkMetadata > | createMetadata (const SQLTypeInfo &column_type) |
static void | throwNotNullViolation (const std::string &parquet_column_name) |
static void | validateNullCount (const std::string &parquet_column_name, int64_t null_count, const SQLTypeInfo &column_type) |
Protected Attributes inherited from foreign_storage::ParquetInPlaceEncoder | |
const size_t | omnisci_data_type_byte_size_ |
const size_t | parquet_data_type_byte_size_ |
Protected Attributes inherited from foreign_storage::ParquetEncoder | |
Data_Namespace::AbstractBuffer * | buffer_ |
bool | is_error_tracking_enabled_ |
RejectedRowIndices | invalid_indices_ |
size_t | current_chunk_offset_ |
SQLTypeInfo | column_type_ |
bool | validate_metadata_stats_ |
Definition at line 114 of file ParquetInPlaceEncoder.h.
|
inline |
Definition at line 116 of file ParquetInPlaceEncoder.h.
|
inline |
Definition at line 129 of file ParquetInPlaceEncoder.h.
|
inline override virtual |
This is a specialization of ParquetInPlaceEncoder::appendData for known types that allows for optimization.
See the comment on ParquetInPlaceEncoder::appendData for details.
Reimplemented from foreign_storage::ParquetInPlaceEncoder.
Definition at line 264 of file ParquetInPlaceEncoder.h.
Referenced by foreign_storage::ParquetStringEncoder< V >::appendData(), foreign_storage::TypedParquetInPlaceEncoder< V, V >::appendDataTrackErrors(), and foreign_storage::TypedParquetInPlaceEncoder< V, V >::validateAndAppendData().
|
inline override virtual |
Implements foreign_storage::ParquetEncoder.
Definition at line 191 of file ParquetInPlaceEncoder.h.
|
inline override virtual |
Implements foreign_storage::ParquetScalarEncoder.
Definition at line 299 of file ParquetInPlaceEncoder.h.
Referenced by foreign_storage::ParquetStringEncoder< V >::encodeAndCopy().
|
inline |
Definition at line 156 of file ParquetInPlaceEncoder.h.
Referenced by foreign_storage::TypedParquetInPlaceEncoder< V, V >::encodedDataToString(), and foreign_storage::TypedParquetInPlaceEncoder< V, V >::setDetectBufferConverterType().
|
inline override virtual |
Implements foreign_storage::ParquetScalarEncoder.
Definition at line 283 of file ParquetInPlaceEncoder.h.
|
inline override virtual |
Implements foreign_storage::ParquetScalarEncoder.
Definition at line 168 of file ParquetInPlaceEncoder.h.
|
inline protected virtual |
Reimplemented in foreign_storage::ParquetStringEncoder< V >, foreign_storage::ParquetFixedLengthEncoder< V, T, NullType >, and foreign_storage::ParquetDecimalEncoder< V, T, NullType >.
Definition at line 362 of file ParquetInPlaceEncoder.h.
Referenced by foreign_storage::TypedParquetInPlaceEncoder< V, V >::appendData().
|
inline override virtual |
Implements foreign_storage::ParquetImportEncoder.
Definition at line 239 of file ParquetInPlaceEncoder.h.
|
inline private |
Definition at line 394 of file ParquetInPlaceEncoder.h.
Referenced by foreign_storage::TypedParquetInPlaceEncoder< V, V >::getRowGroupMetadata().
|
inline override virtual |
Reimplemented from foreign_storage::ParquetEncoder.
Definition at line 308 of file ParquetInPlaceEncoder.h.
|
inline protected |
Definition at line 364 of file ParquetInPlaceEncoder.h.
Referenced by foreign_storage::ParquetDateInSecondsEncoder< NullType >::validate(), foreign_storage::ParquetTimestampEncoder< V, T, conversion_denominator *kSecsPerDay, NullType >::validate(), foreign_storage::ParquetUnsignedFixedLengthEncoder< V, T, U, NullType >::validate(), and foreign_storage::ParquetFixedLengthEncoder< V, T, NullType >::validateIntegralOrFloatingPointMetadata().
|
inline static private |
Definition at line 371 of file ParquetInPlaceEncoder.h.
Referenced by foreign_storage::TypedParquetInPlaceEncoder< V, V >::getRowGroupMetadata().
|
inline |
Definition at line 145 of file ParquetInPlaceEncoder.h.
Referenced by foreign_storage::TypedParquetInPlaceEncoder< V, V >::elementToString().
|
inline |
Definition at line 151 of file ParquetInPlaceEncoder.h.
Referenced by foreign_storage::TypedParquetInPlaceEncoder< V, V >::elementToString().
|
inline override virtual |
Implements foreign_storage::ParquetInPlaceEncoder.
Definition at line 187 of file ParquetInPlaceEncoder.h.
|
inline |
Definition at line 173 of file ParquetInPlaceEncoder.h.
Referenced by foreign_storage::TypedParquetInPlaceEncoder< V, V >::TypedParquetInPlaceEncoder().
|
inline override virtual |
Implements foreign_storage::ParquetScalarEncoder.
Definition at line 294 of file ParquetInPlaceEncoder.h.
|
inline override virtual |
Implements foreign_storage::ParquetScalarEncoder.
Reimplemented in foreign_storage::ParquetTimestampEncoder< V, T, conversion_denominator, NullType >, and foreign_storage::ParquetTimestampEncoder< V, T, conversion_denominator *kSecsPerDay, NullType >.
Definition at line 139 of file ParquetInPlaceEncoder.h.
Referenced by foreign_storage::TypedParquetInPlaceEncoder< V, V >::validateAndAppendData(), and foreign_storage::TypedParquetInPlaceEncoder< V, V >::validateUsingEncodersColumnType().
|
inline override virtual |
Implements foreign_storage::ParquetImportEncoder.
Definition at line 217 of file ParquetInPlaceEncoder.h.
|
inline override virtual |
Implements foreign_storage::ParquetScalarEncoder.
Definition at line 182 of file ParquetInPlaceEncoder.h.
Referenced by foreign_storage::TypedParquetInPlaceEncoder< V, V >::appendDataTrackErrors().
|
private |
Definition at line 430 of file ParquetInPlaceEncoder.h.
Referenced by foreign_storage::TypedParquetInPlaceEncoder< V, V >::validateAndAppendData().