OmniSciDB
c1a53651b2
|
Classes | |
struct | MaxRowGroupSizeStats |
Functions | |
bool | within_range (int64_t lower_bound, int64_t upper_bound, int64_t value) |
bool | is_valid_parquet_string (const parquet::ColumnDescriptor *parquet_column) |
bool | is_valid_parquet_list_column (const parquet::ColumnDescriptor *parquet_column) |
Detect a valid list parquet column. More... | |
template<typename V , typename NullType > | |
std::shared_ptr< ParquetEncoder > | create_parquet_decimal_encoder_with_omnisci_type (const ColumnDescriptor *column_descriptor, const parquet::ColumnDescriptor *parquet_column_descriptor, AbstractBuffer *buffer) |
std::shared_ptr< ParquetEncoder > | create_parquet_decimal_encoder (const ColumnDescriptor *omnisci_column, const parquet::ColumnDescriptor *parquet_column, AbstractBuffer *buffer, const bool is_metadata_scan_or_for_import) |
template<typename V , typename T , typename U , typename NullType > | |
std::shared_ptr< ParquetEncoder > | create_parquet_signed_or_unsigned_integral_encoder_with_types (AbstractBuffer *buffer, const size_t omnisci_data_type_byte_size, const size_t parquet_data_type_byte_size, const bool is_signed) |
Create a signed or unsigned integral parquet encoder using types. More... | |
template<typename V , typename NullType > | |
std::shared_ptr< ParquetEncoder > | create_parquet_integral_encoder_with_omnisci_type (AbstractBuffer *buffer, const size_t omnisci_data_type_byte_size, const size_t parquet_data_type_byte_size, const int bit_width, const bool is_signed) |
Create an integral parquet encoder using types. More... | |
std::shared_ptr< ParquetEncoder > | create_parquet_integral_encoder (const ColumnDescriptor *omnisci_column, const parquet::ColumnDescriptor *parquet_column, AbstractBuffer *buffer, const bool is_metadata_scan_or_for_import) |
std::shared_ptr< ParquetEncoder > | create_parquet_floating_point_encoder (const ColumnDescriptor *omnisci_column, const parquet::ColumnDescriptor *parquet_column, AbstractBuffer *buffer) |
std::shared_ptr< ParquetEncoder > | create_parquet_none_type_encoder (const ColumnDescriptor *omnisci_column, const parquet::ColumnDescriptor *parquet_column, AbstractBuffer *buffer) |
template<typename V , typename T , typename NullType > | |
std::shared_ptr< ParquetEncoder > | create_parquet_timestamp_encoder_with_types (const ColumnDescriptor *omnisci_column, const parquet::ColumnDescriptor *parquet_column, AbstractBuffer *buffer) |
template<typename V , typename T , typename NullType > | |
std::shared_ptr< ParquetEncoder > | create_parquet_date_from_timestamp_encoder_with_types (const ColumnDescriptor *omnisci_column, const parquet::ColumnDescriptor *parquet_column, AbstractBuffer *buffer, const bool is_metadata_scan_or_for_import) |
std::shared_ptr< ParquetEncoder > | create_parquet_timestamp_encoder (const ColumnDescriptor *omnisci_column, const parquet::ColumnDescriptor *parquet_column, AbstractBuffer *buffer, const bool is_metadata_scan_or_for_import) |
template<typename V , typename T , typename NullType > | |
std::shared_ptr< ParquetEncoder > | create_parquet_time_encoder_with_types (const ColumnDescriptor *omnisci_column, const parquet::ColumnDescriptor *parquet_column, AbstractBuffer *buffer) |
std::shared_ptr< ParquetEncoder > | create_parquet_time_encoder (const ColumnDescriptor *omnisci_column, const parquet::ColumnDescriptor *parquet_column, AbstractBuffer *buffer, const bool is_metadata_scan_or_for_import) |
std::shared_ptr< ParquetEncoder > | create_parquet_date_from_timestamp_encoder (const ColumnDescriptor *omnisci_column, const parquet::ColumnDescriptor *parquet_column, AbstractBuffer *buffer, const bool is_metadata_scan_or_for_import) |
std::shared_ptr< ParquetEncoder > | create_parquet_date_encoder (const ColumnDescriptor *omnisci_column, const parquet::ColumnDescriptor *parquet_column, AbstractBuffer *buffer, const bool is_metadata_scan_or_for_import) |
std::shared_ptr< ParquetEncoder > | create_parquet_string_encoder (const ColumnDescriptor *omnisci_column, const parquet::ColumnDescriptor *parquet_column, const Chunk_NS::Chunk &chunk, StringDictionary *string_dictionary, std::list< std::unique_ptr< ChunkMetadata >> &chunk_metadata, bool is_for_import, const bool is_for_detect) |
std::shared_ptr< ParquetEncoder > | create_parquet_geospatial_encoder (const ColumnDescriptor *omnisci_column, const parquet::ColumnDescriptor *parquet_column, std::list< Chunk_NS::Chunk > &chunks, std::list< std::unique_ptr< ChunkMetadata >> &chunk_metadata, const RenderGroupAnalyzerMap *render_group_analyzer_map, const bool is_metadata_scan, const bool is_for_import) |
std::shared_ptr< ParquetEncoder > | create_parquet_array_encoder (const ColumnDescriptor *omnisci_column, const parquet::ColumnDescriptor *parquet_column, std::list< Chunk_NS::Chunk > &chunks, StringDictionary *string_dictionary, std::list< std::unique_ptr< ChunkMetadata >> &chunk_metadata, const bool is_metadata_scan, const bool is_for_import, const bool is_for_detect) |
std::shared_ptr< ParquetEncoder > | create_parquet_encoder (const ColumnDescriptor *omnisci_column, const parquet::ColumnDescriptor *parquet_column, std::list< Chunk_NS::Chunk > &chunks, StringDictionary *string_dictionary, std::list< std::unique_ptr< ChunkMetadata >> &chunk_metadata, const RenderGroupAnalyzerMap *render_group_analyzer_map, const bool is_metadata_scan=false, const bool is_for_import=false, const bool is_for_detect=false) |
Create a Parquet specific encoder for a Parquet to OmniSci mapping. More... | |
std::shared_ptr< ParquetEncoder > | create_parquet_encoder_for_import (std::list< Chunk_NS::Chunk > &chunks, const ColumnDescriptor *omnisci_column, const parquet::ColumnDescriptor *parquet_column, StringDictionary *string_dictionary, const RenderGroupAnalyzerMap *render_group_analyzer_map) |
std::shared_ptr< ParquetEncoder > | create_parquet_encoder_for_metadata_scan (const ColumnDescriptor *omnisci_column, const parquet::ColumnDescriptor *parquet_column, const RenderGroupAnalyzerMap *render_group_analyzer_map) |
void | validate_definition_levels (const parquet::ParquetFileReader *reader, const int row_group_index, const int column_index, const int16_t *def_levels, const int64_t num_levels, const parquet::ColumnDescriptor *parquet_column_descriptor) |
void | validate_max_repetition_and_definition_level (const ColumnDescriptor *omnisci_column_descriptor, const parquet::ColumnDescriptor *parquet_column_descriptor) |
void | resize_values_buffer (const ColumnDescriptor *omnisci_column, const parquet::ColumnDescriptor *parquet_column, std::vector< int8_t > &values) |
bool | validate_decimal_mapping (const ColumnDescriptor *omnisci_column, const parquet::ColumnDescriptor *parquet_column) |
SQLTypeInfo | suggest_decimal_mapping (const parquet::ColumnDescriptor *parquet_column) |
bool | validate_floating_point_mapping (const ColumnDescriptor *omnisci_column, const parquet::ColumnDescriptor *parquet_column) |
SQLTypeInfo | suggest_floating_point_mapping (const parquet::ColumnDescriptor *parquet_column) |
bool | validate_integral_mapping (const ColumnDescriptor *omnisci_column, const parquet::ColumnDescriptor *parquet_column) |
SQLTypeInfo | suggest_integral_mapping (const parquet::ColumnDescriptor *parquet_column) |
bool | is_nanosecond_precision (const ColumnDescriptor *omnisci_column) |
bool | is_nanosecond_precision (const parquet::TimestampLogicalType *timestamp_logical_column) |
bool | is_microsecond_precision (const ColumnDescriptor *omnisci_column) |
bool | is_microsecond_precision (const parquet::TimestampLogicalType *timestamp_logical_column) |
bool | is_millisecond_precision (const ColumnDescriptor *omnisci_column) |
bool | is_millisecond_precision (const parquet::TimestampLogicalType *timestamp_logical_column) |
bool | validate_none_type_mapping (const ColumnDescriptor *omnisci_column, const parquet::ColumnDescriptor *parquet_column) |
SQLTypeInfo | suggest_boolean_type_mapping (const parquet::ColumnDescriptor *parquet_column) |
bool | validate_timestamp_mapping (const ColumnDescriptor *omnisci_column, const parquet::ColumnDescriptor *parquet_column) |
SQLTypeInfo | suggest_timestamp_mapping (const parquet::ColumnDescriptor *parquet_column) |
bool | validate_time_mapping (const ColumnDescriptor *omnisci_column, const parquet::ColumnDescriptor *parquet_column) |
SQLTypeInfo | suggest_time_mapping (const parquet::ColumnDescriptor *parquet_column) |
bool | validate_date_mapping (const ColumnDescriptor *omnisci_column, const parquet::ColumnDescriptor *parquet_column) |
SQLTypeInfo | suggest_date_mapping (const parquet::ColumnDescriptor *parquet_column) |
bool | validate_string_mapping (const ColumnDescriptor *omnisci_column, const parquet::ColumnDescriptor *parquet_column) |
SQLTypeInfo | suggest_string_mapping (const parquet::ColumnDescriptor *parquet_column) |
bool | validate_array_mapping (const ColumnDescriptor *omnisci_column, const parquet::ColumnDescriptor *parquet_column) |
bool | validate_geospatial_mapping (const ColumnDescriptor *omnisci_column, const parquet::ColumnDescriptor *parquet_column) |
void | validate_equal_schema (const parquet::arrow::FileReader *reference_file_reader, const parquet::arrow::FileReader *new_file_reader, const std::string &reference_file_path, const std::string &new_file_path) |
void | validate_allowed_mapping (const parquet::ColumnDescriptor *parquet_column, const ColumnDescriptor *omnisci_column) |
SQLTypeInfo | suggest_column_scalar_type (const parquet::ColumnDescriptor *parquet_column) |
void | validate_number_of_columns (const std::shared_ptr< parquet::FileMetaData > &file_metadata, const std::string &file_path, const ForeignTableSchema &schema) |
void | throw_missing_metadata_error (const int row_group_index, const int column_index, const std::string &file_path) |
void | throw_row_group_larger_than_fragment_size_error (const MaxRowGroupSizeStats max_row_group_stats, const int fragment_size) |
MaxRowGroupSizeStats | validate_column_mapping_and_row_group_metadata (const std::shared_ptr< parquet::FileMetaData > &file_metadata, const std::string &file_path, const ForeignTableSchema &schema) |
MaxRowGroupSizeStats | validate_parquet_metadata (const std::shared_ptr< parquet::FileMetaData > &file_metadata, const std::string &file_path, const ForeignTableSchema &schema) |
std::list< RowGroupMetadata > | metadata_scan_rowgroup_interval (const std::map< int, std::shared_ptr< ParquetEncoder >> &encoder_map, const RowGroupInterval &row_group_interval, const ReaderPtr &reader, const ForeignTableSchema &schema) |
std::map< int, std::shared_ptr < ParquetEncoder > > | populate_encoder_map_for_import (const std::map< int, Chunk_NS::Chunk > chunks, const ForeignTableSchema &schema, const ReaderPtr &reader, const std::map< int, StringDictionary * > column_dictionaries, const int64_t num_rows, const RenderGroupAnalyzerMap *render_group_analyzer_map) |
std::map< int, std::shared_ptr < ParquetEncoder > > | populate_encoder_map_for_metadata_scan (const Interval< ColumnType > &column_interval, const ForeignTableSchema &schema, const ReaderPtr &reader, const RenderGroupAnalyzerMap *render_group_analyzer_map, const bool do_metadata_stats_validation) |
std::shared_ptr< ParquetEncoder > foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::create_parquet_array_encoder | ( | const ColumnDescriptor * | omnisci_column, |
const parquet::ColumnDescriptor * | parquet_column, | ||
std::list< Chunk_NS::Chunk > & | chunks, | ||
StringDictionary * | string_dictionary, | ||
std::list< std::unique_ptr< ChunkMetadata >> & | chunk_metadata, | ||
const bool | is_metadata_scan, | ||
const bool | is_for_import, | ||
const bool | is_for_detect | ||
) |
Definition at line 1018 of file LazyParquetChunkLoader.cpp.
References CHECK, ColumnDescriptor::columnType, create_parquet_encoder(), foreign_storage::get_sub_type_column_descriptor(), SQLTypeInfo::is_array(), SQLTypeInfo::is_fixlen_array(), and is_valid_parquet_list_column().
Referenced by create_parquet_encoder().
std::shared_ptr<ParquetEncoder> foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::create_parquet_date_encoder | ( | const ColumnDescriptor * | omnisci_column, |
const parquet::ColumnDescriptor * | parquet_column, | ||
AbstractBuffer * | buffer, | ||
const bool | is_metadata_scan_or_for_import | ||
) |
Definition at line 736 of file LazyParquetChunkLoader.cpp.
References ColumnDescriptor::columnType, kENCODING_DATE_IN_DAYS, kENCODING_NONE, and UNREACHABLE.
Referenced by create_parquet_encoder().
std::shared_ptr<ParquetEncoder> foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::create_parquet_date_from_timestamp_encoder | ( | const ColumnDescriptor * | omnisci_column, |
const parquet::ColumnDescriptor * | parquet_column, | ||
AbstractBuffer * | buffer, | ||
const bool | is_metadata_scan_or_for_import | ||
) |
Definition at line 693 of file LazyParquetChunkLoader.cpp.
References CHECK, ColumnDescriptor::columnType, create_parquet_date_from_timestamp_encoder_with_types(), kENCODING_DATE_IN_DAYS, and UNREACHABLE.
Referenced by create_parquet_encoder().
std::shared_ptr<ParquetEncoder> foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::create_parquet_date_from_timestamp_encoder_with_types | ( | const ColumnDescriptor * | omnisci_column, |
const parquet::ColumnDescriptor * | parquet_column, | ||
AbstractBuffer * | buffer, | ||
const bool | is_metadata_scan_or_for_import | ||
) |
Definition at line 508 of file LazyParquetChunkLoader.cpp.
References heavydb.dtypes::T, and UNREACHABLE.
Referenced by create_parquet_date_from_timestamp_encoder().
std::shared_ptr<ParquetEncoder> foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::create_parquet_decimal_encoder | ( | const ColumnDescriptor * | omnisci_column, |
const parquet::ColumnDescriptor * | parquet_column, | ||
AbstractBuffer * | buffer, | ||
const bool | is_metadata_scan_or_for_import | ||
) |
Definition at line 171 of file LazyParquetChunkLoader.cpp.
References CHECK, ColumnDescriptor::columnType, SQLTypeInfo::get_comp_param(), SQLTypeInfo::get_compression(), kENCODING_FIXED, kENCODING_NONE, and UNREACHABLE.
Referenced by create_parquet_encoder().
std::shared_ptr<ParquetEncoder> foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::create_parquet_decimal_encoder_with_omnisci_type | ( | const ColumnDescriptor * | column_descriptor, |
const parquet::ColumnDescriptor * | parquet_column_descriptor, | ||
AbstractBuffer * | buffer | ||
) |
std::shared_ptr<ParquetEncoder> foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::create_parquet_encoder | ( | const ColumnDescriptor * | omnisci_column, |
const parquet::ColumnDescriptor * | parquet_column, | ||
std::list< Chunk_NS::Chunk > & | chunks, | ||
StringDictionary * | string_dictionary, | ||
std::list< std::unique_ptr< ChunkMetadata >> & | chunk_metadata, | ||
const RenderGroupAnalyzerMap * | render_group_analyzer_map, | ||
const bool | is_metadata_scan = false , |
||
const bool | is_for_import = false , |
||
const bool | is_for_detect = false |
||
) |
Create a Parquet specific encoder for a Parquet to OmniSci mapping.
omnisci_column | - the descriptor of OmniSci column |
parquet_column | - the descriptor of Parquet column |
chunks | - list of chunks to populate (the case of more than one chunk happens only if a logical column expands to multiple physical columns) |
string_dictionary | - string dictionary used in encoding for string dictionary encoded columns |
chunk_metadata | - similar to the list of chunks, a list of chunk metadata that is populated |
is_metadata_scan | - a flag indicating if the encoders created should be for a metadata scan |
is_for_import | - a flag indicating if the encoders created should be for import |
Notes:
This function and isColumnMappingSupported work in conjunction with each other. For example, once a mapping is known to be allowed (since isColumnMappingSupported returned true) this function does not have to check many corner cases exhaustively as it would be redundant with what was checked in isColumnMappingSupported.
Definition at line 902 of file LazyParquetChunkLoader.cpp.
References CHECK, create_parquet_array_encoder(), create_parquet_date_encoder(), create_parquet_date_from_timestamp_encoder(), create_parquet_decimal_encoder(), create_parquet_floating_point_encoder(), create_parquet_geospatial_encoder(), create_parquet_integral_encoder(), create_parquet_none_type_encoder(), create_parquet_string_encoder(), create_parquet_time_encoder(), create_parquet_timestamp_encoder(), and UNREACHABLE.
Referenced by foreign_storage::LazyParquetChunkLoader::appendRowGroups(), create_parquet_array_encoder(), create_parquet_encoder_for_import(), and create_parquet_encoder_for_metadata_scan().
std::shared_ptr<ParquetEncoder> foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::create_parquet_encoder_for_import | ( | std::list< Chunk_NS::Chunk > & | chunks, |
const ColumnDescriptor * | omnisci_column, | ||
const parquet::ColumnDescriptor * | parquet_column, | ||
StringDictionary * | string_dictionary, | ||
const RenderGroupAnalyzerMap * | render_group_analyzer_map | ||
) |
Intended to be used for the import case.
Definition at line 982 of file LazyParquetChunkLoader.cpp.
References create_parquet_encoder().
Referenced by populate_encoder_map_for_import().
std::shared_ptr<ParquetEncoder> foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::create_parquet_encoder_for_metadata_scan | ( | const ColumnDescriptor * | omnisci_column, |
const parquet::ColumnDescriptor * | parquet_column, | ||
const RenderGroupAnalyzerMap * | render_group_analyzer_map | ||
) |
Intended to be used only with metadata scan. Creates an incomplete encoder capable of updating metadata.
Definition at line 1003 of file LazyParquetChunkLoader.cpp.
References create_parquet_encoder().
Referenced by populate_encoder_map_for_metadata_scan().
std::shared_ptr<ParquetEncoder> foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::create_parquet_floating_point_encoder | ( | const ColumnDescriptor * | omnisci_column, |
const parquet::ColumnDescriptor * | parquet_column, | ||
AbstractBuffer * | buffer | ||
) |
Definition at line 427 of file LazyParquetChunkLoader.cpp.
References CHECK, CHECK_EQ, ColumnDescriptor::columnType, kDOUBLE, kENCODING_NONE, kFLOAT, and UNREACHABLE.
Referenced by create_parquet_encoder().
std::shared_ptr<ParquetEncoder> foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::create_parquet_geospatial_encoder | ( | const ColumnDescriptor * | omnisci_column, |
const parquet::ColumnDescriptor * | parquet_column, | ||
std::list< Chunk_NS::Chunk > & | chunks, | ||
std::list< std::unique_ptr< ChunkMetadata >> & | chunk_metadata, | ||
const RenderGroupAnalyzerMap * | render_group_analyzer_map, | ||
const bool | is_metadata_scan, | ||
const bool | is_for_import | ||
) |
Definition at line 830 of file LazyParquetChunkLoader.cpp.
References ColumnDescriptor::columnType, and is_valid_parquet_string().
Referenced by create_parquet_encoder().
std::shared_ptr<ParquetEncoder> foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::create_parquet_integral_encoder | ( | const ColumnDescriptor * | omnisci_column, |
const parquet::ColumnDescriptor * | parquet_column, | ||
AbstractBuffer * | buffer, | ||
const bool | is_metadata_scan_or_for_import | ||
) |
Definition at line 297 of file LazyParquetChunkLoader.cpp.
References CHECK, ColumnDescriptor::columnType, kBIGINT, kENCODING_NONE, kINT, kSMALLINT, kTINYINT, and UNREACHABLE.
Referenced by create_parquet_encoder().
std::shared_ptr<ParquetEncoder> foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::create_parquet_integral_encoder_with_omnisci_type | ( | AbstractBuffer * | buffer, |
const size_t | omnisci_data_type_byte_size, | ||
const size_t | parquet_data_type_byte_size, | ||
const int | bit_width, | ||
const bool | is_signed | ||
) |
Create an integral parquet encoder using types.
buffer | - buffer used within the encoder |
omnisci_data_type_byte_size | - size in number of bytes of OmniSci type |
parquet_data_type_byte_size | - size in number of bytes of Parquet physical type |
bit_width | - bit width specified for the Parquet column |
is_signed | - flag indicating if Parquet column is signed |
See the documentation for ParquetFixedLengthEncoder and ParquetUnsignedFixedLengthEncoder for a description of the semantics of the templated types V and NullType.
Note, this function determines the appropriate bit depth integral encoder to create, while create_parquet_signed_or_unsigned_integral_encoder_with_types determines whether to create a signed or unsigned integral encoder.
Definition at line 260 of file LazyParquetChunkLoader.cpp.
References create_parquet_signed_or_unsigned_integral_encoder_with_types(), and UNREACHABLE.
std::shared_ptr<ParquetEncoder> foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::create_parquet_none_type_encoder | ( | const ColumnDescriptor * | omnisci_column, |
const parquet::ColumnDescriptor * | parquet_column, | ||
AbstractBuffer * | buffer | ||
) |
Definition at line 458 of file LazyParquetChunkLoader.cpp.
References ColumnDescriptor::columnType, SQLTypeInfo::is_string(), kBOOLEAN, kENCODING_NONE, and UNREACHABLE.
Referenced by create_parquet_encoder().
std::shared_ptr<ParquetEncoder> foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::create_parquet_signed_or_unsigned_integral_encoder_with_types | ( | AbstractBuffer * | buffer, |
const size_t | omnisci_data_type_byte_size, | ||
const size_t | parquet_data_type_byte_size, | ||
const bool | is_signed | ||
) |
Create a signed or unsigned integral parquet encoder using types.
buffer | - buffer used within the encoder |
omnisci_data_type_byte_size | - size in number of bytes of OmniSci type |
parquet_data_type_byte_size | - size in number of bytes of Parquet physical type |
is_signed | - flag indicating if Parquet column is signed |
See the documentation for ParquetFixedLengthEncoder and ParquetUnsignedFixedLengthEncoder for a description of the semantics of the templated types V, T, U, and NullType.
Definition at line 225 of file LazyParquetChunkLoader.cpp.
References CHECK.
Referenced by create_parquet_integral_encoder_with_omnisci_type().
std::shared_ptr<ParquetEncoder> foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::create_parquet_string_encoder | ( | const ColumnDescriptor * | omnisci_column, |
const parquet::ColumnDescriptor * | parquet_column, | ||
const Chunk_NS::Chunk & | chunk, | ||
StringDictionary * | string_dictionary, | ||
std::list< std::unique_ptr< ChunkMetadata >> & | chunk_metadata, | ||
bool | is_for_import, | ||
const bool | is_for_detect | ||
) |
Definition at line 777 of file LazyParquetChunkLoader.cpp.
References ColumnDescriptor::columnType, Chunk_NS::Chunk::getBuffer(), Chunk_NS::Chunk::getIndexBuf(), SQLTypeInfo::is_string(), is_valid_parquet_string(), kENCODING_DICT, kENCODING_NONE, and UNREACHABLE.
Referenced by create_parquet_encoder().
std::shared_ptr<ParquetEncoder> foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::create_parquet_time_encoder | ( | const ColumnDescriptor * | omnisci_column, |
const parquet::ColumnDescriptor * | parquet_column, | ||
AbstractBuffer * | buffer, | ||
const bool | is_metadata_scan_or_for_import | ||
) |
Definition at line 640 of file LazyParquetChunkLoader.cpp.
References CHECK, ColumnDescriptor::columnType, kENCODING_FIXED, kENCODING_NONE, and UNREACHABLE.
Referenced by create_parquet_encoder().
std::shared_ptr<ParquetEncoder> foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::create_parquet_time_encoder_with_types | ( | const ColumnDescriptor * | omnisci_column, |
const parquet::ColumnDescriptor * | parquet_column, | ||
AbstractBuffer * | buffer | ||
) |
std::shared_ptr<ParquetEncoder> foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::create_parquet_timestamp_encoder | ( | const ColumnDescriptor * | omnisci_column, |
const parquet::ColumnDescriptor * | parquet_column, | ||
AbstractBuffer * | buffer, | ||
const bool | is_metadata_scan_or_for_import | ||
) |
Definition at line 555 of file LazyParquetChunkLoader.cpp.
References CHECK, ColumnDescriptor::columnType, SQLTypeInfo::get_precision(), kENCODING_FIXED, kENCODING_NONE, and UNREACHABLE.
Referenced by create_parquet_encoder().
std::shared_ptr<ParquetEncoder> foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::create_parquet_timestamp_encoder_with_types | ( | const ColumnDescriptor * | omnisci_column, |
const parquet::ColumnDescriptor * | parquet_column, | ||
AbstractBuffer * | buffer | ||
) |
bool foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::is_microsecond_precision | ( | const ColumnDescriptor * | omnisci_column | ) |
Definition at line 1298 of file LazyParquetChunkLoader.cpp.
References ColumnDescriptor::columnType, and SQLTypeInfo::get_dimension().
Referenced by suggest_timestamp_mapping(), and validate_timestamp_mapping().
bool foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::is_microsecond_precision | ( | const parquet::TimestampLogicalType * | timestamp_logical_column | ) |
Definition at line 1302 of file LazyParquetChunkLoader.cpp.
bool foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::is_millisecond_precision | ( | const ColumnDescriptor * | omnisci_column | ) |
Definition at line 1307 of file LazyParquetChunkLoader.cpp.
References ColumnDescriptor::columnType, and SQLTypeInfo::get_dimension().
Referenced by suggest_timestamp_mapping(), and validate_timestamp_mapping().
bool foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::is_millisecond_precision | ( | const parquet::TimestampLogicalType * | timestamp_logical_column | ) |
Definition at line 1311 of file LazyParquetChunkLoader.cpp.
bool foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::is_nanosecond_precision | ( | const ColumnDescriptor * | omnisci_column | ) |
Definition at line 1289 of file LazyParquetChunkLoader.cpp.
References ColumnDescriptor::columnType, and SQLTypeInfo::get_dimension().
Referenced by suggest_timestamp_mapping(), and validate_timestamp_mapping().
bool foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::is_nanosecond_precision | ( | const parquet::TimestampLogicalType * | timestamp_logical_column | ) |
Definition at line 1293 of file LazyParquetChunkLoader.cpp.
bool foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::is_valid_parquet_list_column | ( | const parquet::ColumnDescriptor * | parquet_column | ) |
Detect a valid list parquet column.
parquet_column | - the parquet column descriptor of the column to detect |
Note: the notion of a valid parquet list column is adapted from the parquet schema specification for logical type definitions:
<list-repetition> group <name> (LIST) { repeated group list { <element-repetition> <element-type> element; } }
Testing has shown that there are small deviations from this specification in at least one library (pyarrow), where the innermost schema node is named "item" as opposed to "element".
The following is also true of the schema definition.
FSI further restricts lists to be defined only at the top level, meaning directly below the root schema node.
Definition at line 101 of file LazyParquetChunkLoader.cpp.
Referenced by create_parquet_array_encoder(), foreign_storage::LazyParquetChunkLoader::suggestColumnMapping(), validate_array_mapping(), validate_column_mapping_and_row_group_metadata(), validate_definition_levels(), and validate_max_repetition_and_definition_level().
bool foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::is_valid_parquet_string | ( | const parquet::ColumnDescriptor * | parquet_column | ) |
Definition at line 59 of file LazyParquetChunkLoader.cpp.
Referenced by create_parquet_geospatial_encoder(), create_parquet_string_encoder(), suggest_column_scalar_type(), suggest_string_mapping(), validate_geospatial_mapping(), and validate_string_mapping().
std::list<RowGroupMetadata> foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::metadata_scan_rowgroup_interval | ( | const std::map< int, std::shared_ptr< ParquetEncoder >> & | encoder_map, |
const RowGroupInterval & | row_group_interval, | ||
const ReaderPtr & | reader, | ||
const ForeignTableSchema & | schema | ||
) |
Definition at line 1676 of file LazyParquetChunkLoader.cpp.
References CHECK, ColumnDescriptor::columnId, foreign_storage::RowGroupInterval::end_index, foreign_storage::RowGroupInterval::file_path, foreign_storage::ForeignTableSchema::getColumnDescriptor(), foreign_storage::ForeignTableSchema::getLogicalAndPhysicalColumns(), foreign_storage::ForeignTableSchema::getLogicalColumn(), foreign_storage::ForeignTableSchema::getParquetColumnIndex(), and foreign_storage::RowGroupInterval::start_index.
Referenced by foreign_storage::LazyParquetChunkLoader::metadataScan().
std::map<int, std::shared_ptr<ParquetEncoder> > foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::populate_encoder_map_for_import | ( | const std::map< int, Chunk_NS::Chunk > | chunks, |
const ForeignTableSchema & | schema, | ||
const ReaderPtr & | reader, | ||
const std::map< int, StringDictionary * > | column_dictionaries, | ||
const int64_t | num_rows, | ||
const RenderGroupAnalyzerMap * | render_group_analyzer_map | ||
) |
Definition at line 1719 of file LazyParquetChunkLoader.cpp.
References create_parquet_encoder_for_import(), shared::get_from_map(), foreign_storage::ForeignTableSchema::getColumnDescriptor(), and foreign_storage::ForeignTableSchema::getParquetColumnIndex().
Referenced by foreign_storage::LazyParquetChunkLoader::loadRowGroups().
std::map<int, std::shared_ptr<ParquetEncoder> > foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::populate_encoder_map_for_metadata_scan | ( | const Interval< ColumnType > & | column_interval, |
const ForeignTableSchema & | schema, | ||
const ReaderPtr & | reader, | ||
const RenderGroupAnalyzerMap * | render_group_analyzer_map, | ||
const bool | do_metadata_stats_validation | ||
) |
Definition at line 1761 of file LazyParquetChunkLoader.cpp.
References create_parquet_encoder_for_metadata_scan(), foreign_storage::Interval< T >::end, shared::get_from_map(), foreign_storage::ForeignTableSchema::getColumnDescriptor(), foreign_storage::ForeignTableSchema::getParquetColumnIndex(), and foreign_storage::Interval< T >::start.
Referenced by foreign_storage::LazyParquetChunkLoader::metadataScan().
void foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::resize_values_buffer(const ColumnDescriptor * omnisci_column,
    const parquet::ColumnDescriptor * parquet_column,
    std::vector< int8_t > & values
)
Definition at line 1136 of file LazyParquetChunkLoader.cpp.
References foreign_storage::LazyParquetChunkLoader::batch_reader_num_elements, ColumnDescriptor::columnType, and SQLTypeInfo::get_size().
Referenced by foreign_storage::LazyParquetChunkLoader::appendRowGroups(), and foreign_storage::ParquetRowGroupReader::readAndValidateRowGroup().
SQLTypeInfo foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::suggest_boolean_type_mapping(const parquet::ColumnDescriptor * parquet_column)
Definition at line 1325 of file LazyParquetChunkLoader.cpp.
References kBOOLEAN, kENCODING_NONE, SQLTypeInfo::set_compression(), SQLTypeInfo::set_fixed_size(), SQLTypeInfo::set_type(), and run_benchmark_import::type.
Referenced by suggest_column_scalar_type().
SQLTypeInfo foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::suggest_column_scalar_type(const parquet::ColumnDescriptor * parquet_column)
Definition at line 1530 of file LazyParquetChunkLoader.cpp.
References is_valid_parquet_string(), suggest_boolean_type_mapping(), suggest_date_mapping(), suggest_decimal_mapping(), suggest_floating_point_mapping(), suggest_integral_mapping(), suggest_string_mapping(), suggest_time_mapping(), and suggest_timestamp_mapping().
Referenced by foreign_storage::LazyParquetChunkLoader::suggestColumnMapping().
SQLTypeInfo foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::suggest_date_mapping(const parquet::ColumnDescriptor * parquet_column)
Definition at line 1429 of file LazyParquetChunkLoader.cpp.
References CHECK, kDATE, kENCODING_NONE, and run_benchmark_import::type.
Referenced by suggest_column_scalar_type().
SQLTypeInfo foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::suggest_decimal_mapping(const parquet::ColumnDescriptor * parquet_column)
Definition at line 1161 of file LazyParquetChunkLoader.cpp.
References kDECIMAL, kENCODING_NONE, sql_constants::kMaxNumericPrecision, SQLTypeInfo::scale, SQLTypeInfo::set_compression(), SQLTypeInfo::set_fixed_size(), SQLTypeInfo::set_precision(), SQLTypeInfo::set_scale(), SQLTypeInfo::set_type(), to_string(), run_benchmark_import::type, and UNREACHABLE.
Referenced by suggest_column_scalar_type().
SQLTypeInfo foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::suggest_floating_point_mapping(const parquet::ColumnDescriptor * parquet_column)
Definition at line 1202 of file LazyParquetChunkLoader.cpp.
References kDOUBLE, kENCODING_NONE, kFLOAT, SQLTypeInfo::set_compression(), SQLTypeInfo::set_fixed_size(), SQLTypeInfo::set_type(), run_benchmark_import::type, and UNREACHABLE.
Referenced by suggest_column_scalar_type().
SQLTypeInfo foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::suggest_integral_mapping(const parquet::ColumnDescriptor * parquet_column)
Definition at line 1244 of file LazyParquetChunkLoader.cpp.
References CHECK, kBIGINT, kENCODING_NONE, kINT, kSMALLINT, kTINYINT, SQLTypeInfo::set_compression(), SQLTypeInfo::set_fixed_size(), SQLTypeInfo::set_type(), run_benchmark_import::type, and within_range().
Referenced by suggest_column_scalar_type().
SQLTypeInfo foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::suggest_string_mapping(const parquet::ColumnDescriptor * parquet_column)
Definition at line 1446 of file LazyParquetChunkLoader.cpp.
References CHECK, is_valid_parquet_string(), kENCODING_DICT, kTEXT, SQLTypeInfo::set_comp_param(), SQLTypeInfo::set_compression(), SQLTypeInfo::set_fixed_size(), SQLTypeInfo::set_type(), and run_benchmark_import::type.
Referenced by suggest_column_scalar_type().
SQLTypeInfo foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::suggest_time_mapping(const parquet::ColumnDescriptor * parquet_column)
Definition at line 1403 of file LazyParquetChunkLoader.cpp.
References CHECK, kENCODING_NONE, kTIME, and run_benchmark_import::type.
Referenced by suggest_column_scalar_type().
SQLTypeInfo foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::suggest_timestamp_mapping(const parquet::ColumnDescriptor * parquet_column)
Definition at line 1369 of file LazyParquetChunkLoader.cpp.
References is_microsecond_precision(), is_millisecond_precision(), is_nanosecond_precision(), kENCODING_NONE, kTIMESTAMP, SQLTypeInfo::set_compression(), SQLTypeInfo::set_fixed_size(), SQLTypeInfo::set_precision(), SQLTypeInfo::set_type(), run_benchmark_import::type, and UNREACHABLE.
Referenced by suggest_column_scalar_type().
void foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::throw_missing_metadata_error(const int row_group_index,
    const int column_index,
    const std::string & file_path
)
Definition at line 1584 of file LazyParquetChunkLoader.cpp.
References to_string().
Referenced by validate_column_mapping_and_row_group_metadata().
void foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::throw_row_group_larger_than_fragment_size_error(const MaxRowGroupSizeStats max_row_group_stats,
    const int fragment_size
)
Definition at line 1600 of file LazyParquetChunkLoader.cpp.
References foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::MaxRowGroupSizeStats::file_path, foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::MaxRowGroupSizeStats::max_row_group_index, foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::MaxRowGroupSizeStats::max_row_group_size, and to_string().
Referenced by foreign_storage::LazyParquetChunkLoader::metadataScan().
void foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::validate_allowed_mapping(const parquet::ColumnDescriptor * parquet_column,
    const ColumnDescriptor * omnisci_column
)
Definition at line 1499 of file LazyParquetChunkLoader.cpp.
References CHECK, ColumnDescriptor::columnName, ColumnDescriptor::columnType, SQLTypeInfo::get_type_name(), foreign_storage::LazyParquetChunkLoader::isColumnMappingSupported(), LOG, run_benchmark_import::type, and logger::WARNING.
Referenced by foreign_storage::LazyParquetChunkLoader::loadRowGroups(), and validate_column_mapping_and_row_group_metadata().
bool foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::validate_array_mapping(const ColumnDescriptor * omnisci_column,
    const parquet::ColumnDescriptor * parquet_column
)
Definition at line 1456 of file LazyParquetChunkLoader.cpp.
References ColumnDescriptor::columnType, foreign_storage::get_sub_type_column_descriptor(), SQLTypeInfo::is_array(), is_valid_parquet_list_column(), and foreign_storage::LazyParquetChunkLoader::isColumnMappingSupported().
Referenced by foreign_storage::LazyParquetChunkLoader::isColumnMappingSupported().
MaxRowGroupSizeStats foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::validate_column_mapping_and_row_group_metadata(const std::shared_ptr< parquet::FileMetaData > & file_metadata,
    const std::string & file_path,
    const ForeignTableSchema & schema
)
Definition at line 1616 of file LazyParquetChunkLoader.cpp.
References foreign_storage::ForeignTableSchema::getLogicalColumns(), is_valid_parquet_list_column(), throw_missing_metadata_error(), and validate_allowed_mapping().
Referenced by validate_parquet_metadata().
bool foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::validate_date_mapping(const ColumnDescriptor * omnisci_column,
    const parquet::ColumnDescriptor * parquet_column
)
Definition at line 1412 of file LazyParquetChunkLoader.cpp.
References ColumnDescriptor::columnType, SQLTypeInfo::get_comp_param(), SQLTypeInfo::get_compression(), SQLTypeInfo::get_type(), kDATE, kENCODING_DATE_IN_DAYS, and kENCODING_NONE.
Referenced by foreign_storage::LazyParquetChunkLoader::isColumnMappingSupported().
bool foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::validate_decimal_mapping(const ColumnDescriptor * omnisci_column,
    const parquet::ColumnDescriptor * parquet_column
)
Definition at line 1147 of file LazyParquetChunkLoader.cpp.
References ColumnDescriptor::columnType, SQLTypeInfo::get_compression(), SQLTypeInfo::get_precision(), SQLTypeInfo::get_scale(), SQLTypeInfo::is_decimal(), kENCODING_FIXED, and kENCODING_NONE.
Referenced by foreign_storage::LazyParquetChunkLoader::isColumnMappingSupported().
void foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::validate_definition_levels(const parquet::ParquetFileReader * reader,
    const int row_group_index,
    const int column_index,
    const int16_t * def_levels,
    const int64_t num_levels,
    const parquet::ColumnDescriptor * parquet_column_descriptor
)
Definition at line 1070 of file LazyParquetChunkLoader.cpp.
References is_valid_parquet_list_column(), and foreign_storage::validate_and_get_column_metadata_statistics().
Referenced by foreign_storage::LazyParquetChunkLoader::appendRowGroups(), and foreign_storage::ParquetRowGroupReader::readAndValidateRowGroup().
void foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::validate_equal_schema(const parquet::arrow::FileReader * reference_file_reader,
    const parquet::arrow::FileReader * new_file_reader,
    const std::string & reference_file_path,
    const std::string & new_file_path
)
Definition at line 1473 of file LazyParquetChunkLoader.cpp.
References foreign_storage::get_column_descriptor(), to_string(), and foreign_storage::validate_equal_column_descriptor().
Referenced by foreign_storage::LazyParquetChunkLoader::metadataScan(), and foreign_storage::LazyParquetChunkLoader::previewFiles().
bool foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::validate_floating_point_mapping(const ColumnDescriptor * omnisci_column,
    const parquet::ColumnDescriptor * parquet_column
)
Definition at line 1186 of file LazyParquetChunkLoader.cpp.
References ColumnDescriptor::columnType, SQLTypeInfo::get_compression(), SQLTypeInfo::get_type(), SQLTypeInfo::is_fp(), kENCODING_NONE, and kFLOAT.
Referenced by foreign_storage::LazyParquetChunkLoader::isColumnMappingSupported().
bool foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::validate_geospatial_mapping(const ColumnDescriptor * omnisci_column,
    const parquet::ColumnDescriptor * parquet_column
)
Definition at line 1467 of file LazyParquetChunkLoader.cpp.
References ColumnDescriptor::columnType, SQLTypeInfo::is_geometry(), and is_valid_parquet_string().
Referenced by foreign_storage::LazyParquetChunkLoader::isColumnMappingSupported().
bool foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::validate_integral_mapping(const ColumnDescriptor * omnisci_column,
    const parquet::ColumnDescriptor * parquet_column
)
Definition at line 1217 of file LazyParquetChunkLoader.cpp.
References CHECK, ColumnDescriptor::columnType, SQLTypeInfo::get_compression(), SQLTypeInfo::get_size(), SQLTypeInfo::is_integer(), kENCODING_FIXED, and kENCODING_NONE.
Referenced by foreign_storage::LazyParquetChunkLoader::isColumnMappingSupported().
void foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::validate_max_repetition_and_definition_level(const ColumnDescriptor * omnisci_column_descriptor,
    const parquet::ColumnDescriptor * parquet_column_descriptor
)
Definition at line 1097 of file LazyParquetChunkLoader.cpp.
References ColumnDescriptor::columnName, ColumnDescriptor::columnType, SQLTypeInfo::is_array(), is_valid_parquet_list_column(), and to_string().
Referenced by foreign_storage::LazyParquetChunkLoader::appendRowGroups(), and foreign_storage::LazyParquetChunkLoader::loadRowGroups().
bool foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::validate_none_type_mapping(const ColumnDescriptor * omnisci_column,
    const parquet::ColumnDescriptor * parquet_column
)
Definition at line 1316 of file LazyParquetChunkLoader.cpp.
References ColumnDescriptor::columnType, SQLTypeInfo::get_compression(), SQLTypeInfo::get_type(), kBOOLEAN, and kENCODING_NONE.
Referenced by foreign_storage::LazyParquetChunkLoader::isColumnMappingSupported().
void foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::validate_number_of_columns(const std::shared_ptr< parquet::FileMetaData > & file_metadata,
    const std::string & file_path,
    const ForeignTableSchema & schema
)
Definition at line 1574 of file LazyParquetChunkLoader.cpp.
References foreign_storage::ForeignTableSchema::numLogicalColumns(), and foreign_storage::throw_number_of_columns_mismatch_error().
Referenced by foreign_storage::LazyParquetChunkLoader::loadRowGroups(), and validate_parquet_metadata().
MaxRowGroupSizeStats foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::validate_parquet_metadata(const std::shared_ptr< parquet::FileMetaData > & file_metadata,
    const std::string & file_path,
    const ForeignTableSchema & schema
)
Definition at line 1668 of file LazyParquetChunkLoader.cpp.
References validate_column_mapping_and_row_group_metadata(), and validate_number_of_columns().
Referenced by foreign_storage::LazyParquetChunkLoader::metadataScan().
bool foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::validate_string_mapping(const ColumnDescriptor * omnisci_column,
    const parquet::ColumnDescriptor * parquet_column
)
Definition at line 1438 of file LazyParquetChunkLoader.cpp.
References ColumnDescriptor::columnType, SQLTypeInfo::get_compression(), SQLTypeInfo::is_string(), is_valid_parquet_string(), kENCODING_DICT, and kENCODING_NONE.
Referenced by foreign_storage::LazyParquetChunkLoader::isColumnMappingSupported().
bool foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::validate_time_mapping(const ColumnDescriptor * omnisci_column,
    const parquet::ColumnDescriptor * parquet_column
)
Definition at line 1389 of file LazyParquetChunkLoader.cpp.
References ColumnDescriptor::columnType, SQLTypeInfo::get_comp_param(), SQLTypeInfo::get_compression(), SQLTypeInfo::get_type(), kENCODING_FIXED, kENCODING_NONE, and kTIME.
Referenced by foreign_storage::LazyParquetChunkLoader::isColumnMappingSupported().
bool foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::validate_timestamp_mapping(const ColumnDescriptor * omnisci_column,
    const parquet::ColumnDescriptor * parquet_column
)
Definition at line 1334 of file LazyParquetChunkLoader.cpp.
References ColumnDescriptor::columnType, SQLTypeInfo::get_comp_param(), SQLTypeInfo::get_compression(), SQLTypeInfo::get_dimension(), SQLTypeInfo::get_type(), is_microsecond_precision(), is_millisecond_precision(), is_nanosecond_precision(), kENCODING_FIXED, kENCODING_NONE, and kTIMESTAMP.
Referenced by foreign_storage::LazyParquetChunkLoader::isColumnMappingSupported().
bool foreign_storage::anonymous_namespace{LazyParquetChunkLoader.cpp}::within_range(int64_t lower_bound,
    int64_t upper_bound,
    int64_t value
)
Definition at line 55 of file LazyParquetChunkLoader.cpp.
References gpu_enabled::upper_bound().
Referenced by suggest_integral_mapping().