OmniSciDB  95562058bd
 All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Friends Macros Pages
foreign_storage::ParquetVariableLengthArrayEncoder Class Reference

#include <ParquetVariableLengthArrayEncoder.h>

+ Inheritance diagram for foreign_storage::ParquetVariableLengthArrayEncoder:
+ Collaboration diagram for foreign_storage::ParquetVariableLengthArrayEncoder:

Public Member Functions

 ParquetVariableLengthArrayEncoder (Data_Namespace::AbstractBuffer *data_buffer, Data_Namespace::AbstractBuffer *index_buffer, std::shared_ptr< ParquetScalarEncoder > scalar_encoder, const ColumnDescriptor *column_desciptor)
 
void appendData (const int16_t *def_levels, const int16_t *rep_levels, const int64_t values_read, const int64_t levels_read, const bool is_last_batch, int8_t *values) override
 
- Public Member Functions inherited from foreign_storage::ParquetArrayEncoder
 ParquetArrayEncoder (Data_Namespace::AbstractBuffer *data_buffer, std::shared_ptr< ParquetScalarEncoder > scalar_encoder, const ColumnDescriptor *column_desciptor)
 
- Public Member Functions inherited from foreign_storage::ParquetEncoder
 ParquetEncoder (Data_Namespace::AbstractBuffer *buffer)
 
virtual ~ParquetEncoder ()=default
 
virtual std::shared_ptr
< ChunkMetadata
getRowGroupMetadata (const parquet::RowGroupMetaData *group_metadata, const int parquet_column_index, const SQLTypeInfo &column_type)
 

Protected Member Functions

void appendArraysToBuffer () override
 
void processLastArray () override
 
- Protected Member Functions inherited from foreign_storage::ParquetArrayEncoder
bool isLastArrayNull () const
 
size_t sizeOfLastArray () const
 
int8_t * resizeArrayDataBytes (const size_t additional_num_elements)
 

Private Member Functions

void setFirstOffsetForBuffer (const int16_t def_level)
 
void appendLastArrayOffset ()
 

Private Attributes

Data_Namespace::AbstractBufferindex_buffer_
 
std::vector< ArrayOffsetToffsets_
 

Additional Inherited Members

- Static Protected Member Functions inherited from foreign_storage::ParquetEncoder
static std::shared_ptr
< ChunkMetadata
createMetadata (const SQLTypeInfo &column_type)
 
- Protected Attributes inherited from foreign_storage::ParquetArrayEncoder
size_t omnisci_data_type_byte_size_
 
std::shared_ptr
< ParquetScalarEncoder
scalar_encoder_
 
std::vector< int8_t > data_buffer_bytes_
 
- Protected Attributes inherited from foreign_storage::ParquetEncoder
Data_Namespace::AbstractBufferbuffer_
 
- Static Protected Attributes inherited from foreign_storage::ParquetArrayEncoder
static const int16_t non_null_def_level = 3
 
static const int16_t item_null_def_level = 2
 
static const int16_t list_null_def_level = 0
 

Detailed Description

Definition at line 23 of file ParquetVariableLengthArrayEncoder.h.

Constructor & Destructor Documentation

foreign_storage::ParquetVariableLengthArrayEncoder::ParquetVariableLengthArrayEncoder ( Data_Namespace::AbstractBuffer data_buffer,
Data_Namespace::AbstractBuffer index_buffer,
std::shared_ptr< ParquetScalarEncoder scalar_encoder,
const ColumnDescriptor column_desciptor 
)
inline

Definition at line 25 of file ParquetVariableLengthArrayEncoder.h.

29  : ParquetArrayEncoder(data_buffer, scalar_encoder, column_desciptor)
30  , index_buffer_(index_buffer) {}
ParquetArrayEncoder(Data_Namespace::AbstractBuffer *data_buffer, std::shared_ptr< ParquetScalarEncoder > scalar_encoder, const ColumnDescriptor *column_desciptor)

Member Function Documentation

void foreign_storage::ParquetVariableLengthArrayEncoder::appendArraysToBuffer ( )
inlineoverrideprotectedvirtual

Reimplemented from foreign_storage::ParquetArrayEncoder.

Definition at line 45 of file ParquetVariableLengthArrayEncoder.h.

References Data_Namespace::AbstractBuffer::append(), foreign_storage::ParquetArrayEncoder::appendArraysToBuffer(), index_buffer_, and offsets_.

45  {
46  index_buffer_->append(reinterpret_cast<int8_t*>(offsets_.data()),
47  offsets_.size() * sizeof(ArrayOffsetT));
48  offsets_.clear();
50  }
int32_t ArrayOffsetT
Definition: sqltypes.h:869
virtual void append(int8_t *src, const size_t num_bytes, const MemoryLevel src_buffer_type=CPU_LEVEL, const int device_id=-1)=0

+ Here is the call graph for this function:

void foreign_storage::ParquetVariableLengthArrayEncoder::appendData ( const int16_t *  def_levels,
const int16_t *  rep_levels,
const int64_t  values_read,
const int64_t  levels_read,
const bool  is_last_batch,
int8_t *  values 
)
inlineoverridevirtual

Reimplemented from foreign_storage::ParquetArrayEncoder.

Definition at line 32 of file ParquetVariableLengthArrayEncoder.h.

References foreign_storage::ParquetArrayEncoder::appendData(), CHECK, and setFirstOffsetForBuffer().

37  {
38  CHECK(levels_read > 0);
39  setFirstOffsetForBuffer(def_levels[0]);
41  def_levels, rep_levels, values_read, levels_read, is_last_batch, values);
42  }
#define CHECK(condition)
Definition: Logger.h:197
void appendData(const int16_t *def_levels, const int16_t *rep_levels, const int64_t values_read, const int64_t levels_read, const bool is_last_batch, int8_t *values) override

+ Here is the call graph for this function:

void foreign_storage::ParquetVariableLengthArrayEncoder::appendLastArrayOffset ( )
inlineprivate

Definition at line 73 of file ParquetVariableLengthArrayEncoder.h.

References foreign_storage::ParquetEncoder::buffer_, foreign_storage::ParquetArrayEncoder::data_buffer_bytes_, foreign_storage::ParquetArrayEncoder::isLastArrayNull(), offsets_, and Data_Namespace::AbstractBuffer::size().

Referenced by processLastArray().

73  {
74  int64_t last_offset = buffer_->size() + data_buffer_bytes_.size();
75  if (!isLastArrayNull()) {
76  // append array data offset
77  offsets_.push_back(last_offset);
78  } else {
79  // append a null array offset
80  offsets_.push_back(-last_offset);
81  }
82  }
Data_Namespace::AbstractBuffer * buffer_

+ Here is the call graph for this function:

+ Here is the caller graph for this function:

void foreign_storage::ParquetVariableLengthArrayEncoder::processLastArray ( )
inlineoverrideprotectedvirtual

Implements foreign_storage::ParquetArrayEncoder.

Definition at line 52 of file ParquetVariableLengthArrayEncoder.h.

References appendLastArrayOffset().

+ Here is the call graph for this function:

void foreign_storage::ParquetVariableLengthArrayEncoder::setFirstOffsetForBuffer ( const int16_t  def_level)
inlineprivate

Definition at line 55 of file ParquetVariableLengthArrayEncoder.h.

References foreign_storage::ParquetEncoder::buffer_, foreign_storage::ParquetArrayEncoder::data_buffer_bytes_, foreign_storage::ParquetArrayEncoder::list_null_def_level, offsets_, and Data_Namespace::AbstractBuffer::size().

Referenced by appendData().

55  {
56  if (data_buffer_bytes_.size() == 0 && buffer_->size() == 0) { // first element
58  // OmniSci variable array types have a special encoding for chunks in
59  // which the first array is null: the first 8 bytes of the chunk are
60  // filled and the offset is set appropriately. Ostensibly, this is
61  // done to allow marking a null array by negating a non-zero value;
62  // however, the choice of 8 appears arbitrary.
63  offsets_.push_back(8);
64  std::vector<int8_t> zero_bytes(8, 0);
65  data_buffer_bytes_.insert(
66  data_buffer_bytes_.end(), zero_bytes.begin(), zero_bytes.end());
67  } else {
68  offsets_.push_back(0);
69  }
70  }
71  }
Data_Namespace::AbstractBuffer * buffer_

+ Here is the call graph for this function:

+ Here is the caller graph for this function:

Member Data Documentation

Data_Namespace::AbstractBuffer* foreign_storage::ParquetVariableLengthArrayEncoder::index_buffer_
private

Definition at line 84 of file ParquetVariableLengthArrayEncoder.h.

Referenced by appendArraysToBuffer().

std::vector<ArrayOffsetT> foreign_storage::ParquetVariableLengthArrayEncoder::offsets_
private

The documentation for this class was generated from the following file: