_col_slot_context_8cpp_source.html

 /*

  * Copyright 2022 HEAVY.AI, Inc.

  *

  * Licensed under the Apache License, Version 2.0 (the "License");

  * you may not use this file except in compliance with the License.

  * You may obtain a copy of the License at

  *

  *     http://www.apache.org/licenses/LICENSE-2.0

  *

  * Unless required by applicable law or agreed to in writing, software

  * distributed under the License is distributed on an "AS IS" BASIS,

  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

  * See the License for the specific language governing permissions and

  * limitations under the License.

  */


 #include "ColSlotContext.h"


 #include "../BufferCompaction.h"


 #include <Analyzer/Analyzer.h>

 #include <Shared/SqlTypesLayout.h>


 #include <numeric>

 #include <stdexcept>


 extern bool g_bigint_count;


 // Builds the column -> slot mapping and the per-slot sizes for the given output
 // column expressions.
 //
 // col_expr_list: one entry per output column; a null entry is treated as a row index
 //   column and gets a single 8-byte slot.
 // col_exprs_to_not_project: either empty, or one entry per column (enforced by a
 //   CHECK). Any entry other than -1 marks the column as not projected, in which case
 //   it only receives a zero-sized placeholder slot.
 //
 // Slots added through the two-argument addSlotForColumn overload get a padded size
 // of -1 (see that overload); callers are expected to assign padded sizes afterwards.
 ColSlotContext::ColSlotContext(const std::vector<Analyzer::Expr*>& col_expr_list,
                                const std::vector<int64_t>& col_exprs_to_not_project) {
   // Note that non-projected col exprs could be projected cols that we can lazy fetch or
   // grouped cols with keyless hash
   const bool has_projection_mask = !col_exprs_to_not_project.empty();
   if (has_projection_mask) {
     CHECK_EQ(col_expr_list.size(), col_exprs_to_not_project.size());
   }
   const size_t col_count = col_expr_list.size();
   col_to_slot_map_.resize(col_count);

   for (size_t col_idx = 0; col_idx < col_count; ++col_idx) {
     if (has_projection_mask && col_exprs_to_not_project[col_idx] != -1) {
       // Not projected: zero padded size and zero logical size.
       addSlotForColumn(0, 0, col_idx);
       continue;
     }

     const auto expr = col_expr_list[col_idx];
     if (!expr) {
       // row index
       addSlotForColumn(sizeof(int64_t), col_idx);
       continue;
     }

     const auto agg_info = get_target_info(expr, g_bigint_count);
     const auto chosen_type = get_compact_type(agg_info);

     const bool is_none_encoded_string =
         chosen_type.is_string() && chosen_type.get_compression() == kENCODING_NONE;
     if (is_none_encoded_string || chosen_type.is_array()) {
       // None-encoded strings and arrays occupy two 8-byte slots.
       addSlotForColumn(sizeof(int64_t), col_idx);
       addSlotForColumn(sizeof(int64_t), col_idx);
       continue;
     }

     if (chosen_type.is_geometry()) {
       if (dynamic_cast<const Analyzer::GeoExpr*>(expr)) {
         CHECK_EQ(chosen_type.get_type(), kPOINT);
         // Pointer/offset into varlen buffer
         addSlotForColumn(sizeof(int64_t), col_idx);
         // Element size recorded for the slot just added: 8 bytes when the point is
         // kENCODING_GEOINT compressed, 16 bytes otherwise.
         const int64_t arr_size =
             chosen_type.get_compression() == kENCODING_GEOINT ? 8 : 16;
         CHECK(varlen_output_slot_map_
                   .insert(std::make_pair(slot_sizes_.size() - 1, arr_size))
                   .second);
       } else {
         // Two 8-byte slots per physical coordinate column.
         const auto physical_col_count = chosen_type.get_physical_coord_cols();
         for (auto physical_col = 0; physical_col < physical_col_count; ++physical_col) {
           addSlotForColumn(sizeof(int64_t), col_idx);
           addSlotForColumn(sizeof(int64_t), col_idx);
         }
       }
       continue;
     }

     // Everything else: a single slot whose logical width is the type's byte width.
     const auto col_expr_bitwidth = get_bit_width(chosen_type);
     CHECK_EQ(size_t(0), col_expr_bitwidth % 8);
     addSlotForColumn(static_cast<int8_t>(col_expr_bitwidth >> 3), col_idx);
     // for average, we'll need to keep the count as well
     if (agg_info.agg_kind == kAVG) {
       CHECK(agg_info.is_agg);
       addSlotForColumn(sizeof(int64_t), col_idx);
     }
   }
 }


 void ColSlotContext::setAllSlotsSize(const int8_t slot_width_size) {

   const SlotSize ss{slot_width_size, slot_width_size};

   std::fill(slot_sizes_.begin(), slot_sizes_.end(), ss);

 }


 void ColSlotContext::setAllSlotsPaddedSize(const int8_t padded_size) {

   for (auto& slot_size : slot_sizes_) {

     slot_size.padded_size = padded_size;

   }

 }


 void ColSlotContext::setAllUnsetSlotsPaddedSize(const int8_t padded_size) {

   for (auto& slot_size : slot_sizes_) {

     if (slot_size.padded_size < 0) {

       slot_size.padded_size = padded_size;

     }

   }

 }


 void ColSlotContext::setAllSlotsPaddedSizeToLogicalSize() {

   for (auto& slot_size : slot_sizes_) {

     slot_size.padded_size = slot_size.logical_size;

   }

 }


 void ColSlotContext::validate() const {

   for (const auto& slot_size : slot_sizes_) {

     CHECK_GE(slot_size.logical_size, 0);

     CHECK_LE(slot_size.logical_size, slot_size.padded_size);

   }

 }


 // Number of columns tracked, i.e. the number of entries in the column -> slot map.
 size_t ColSlotContext::getColCount() const {
   const size_t column_count = col_to_slot_map_.size();
   return column_count;
 }

 // Number of slots tracked across all columns.
 size_t ColSlotContext::getSlotCount() const {
   const size_t slot_count = slot_sizes_.size();
   return slot_count;
 }


 size_t ColSlotContext::getAllSlotsPaddedSize() const {

   return std::accumulate(slot_sizes_.cbegin(),

                          slot_sizes_.cend(),

                          size_t(0),

                          [](size_t sum, const auto& slot_size) {

                            CHECK_GE(slot_size.padded_size, 0);

                            return sum + static_cast<size_t>(slot_size.padded_size);

                          });

 }


 // Aligned padded size covering every slot; delegates to
 // getAlignedPaddedSizeForRange with the full slot count.
 size_t ColSlotContext::getAllSlotsAlignedPaddedSize() const {
   const size_t slot_count = slot_sizes_.size();
   return getAlignedPaddedSizeForRange(slot_count);
 }


 size_t ColSlotContext::getAlignedPaddedSizeForRange(const size_t end) const {

   return std::accumulate(slot_sizes_.cbegin(),

                          slot_sizes_.cbegin() + end,

                          size_t(0),

                          [](size_t sum, const auto& slot_size) {

                            CHECK_GE(slot_size.padded_size, 0);

                            const auto chosen_bytes =

                                static_cast<size_t>(slot_size.padded_size);

                            if (chosen_bytes == sizeof(int64_t)) {

                              return align_to_int64(sum) + chosen_bytes;

                            } else {

                              return sum + chosen_bytes;

                            }

                          });

 }


 size_t ColSlotContext::getTotalBytesOfColumnarBuffers(const size_t entry_count) const {

   const auto total_bytes = std::accumulate(

       slot_sizes_.cbegin(),

       slot_sizes_.cend(),

       size_t(0),

       [entry_count](size_t sum, const auto& slot_size) {

         CHECK_GE(slot_size.padded_size, 0);

         return sum +

                align_to_int64(static_cast<size_t>(slot_size.padded_size) * entry_count);

       });

   return align_to_int64(total_bytes);

 }


 // Returns the smaller of actual_min_byte_width and the smallest padded size among
 // all slots. With no slots, actual_min_byte_width is returned unchanged.
 int8_t ColSlotContext::getMinPaddedByteSize(const int8_t actual_min_byte_width) const {
   int8_t smallest_width = actual_min_byte_width;
   for (const auto& slot : slot_sizes_) {
     if (slot.padded_size < smallest_width) {
       smallest_width = slot.padded_size;
     }
   }
   return smallest_width;
 }


 // Returns the single padded width shared by all slots with a non-zero padded size.
 //  - No slots at all: returns 8.
 //  - Only zero-width slots: returns 0.
 //  - Otherwise: the width of the first non-zero slot; a CHECK fails if any other
 //    non-zero slot has a different width.
 size_t ColSlotContext::getCompactByteWidth() const {
   if (slot_sizes_.empty()) {
     return 8;
   }
   const auto first_sized_slot =
       std::find_if(slot_sizes_.cbegin(), slot_sizes_.cend(), [](const auto& candidate) {
         return candidate.padded_size != 0;
       });
   if (first_sized_slot == slot_sizes_.cend()) {
     return 0;
   }
   const size_t compact_width = first_sized_slot->padded_size;
   CHECK_GT(compact_width, size_t(0));
   for (const auto& slot_size : slot_sizes_) {
     if (slot_size.padded_size != 0) {
       CHECK_EQ(static_cast<size_t>(slot_size.padded_size), compact_width);
     }
   }
   return compact_width;
 }


 // Byte offset of slot slot_idx: the aligned padded size of all preceding slots,
 // additionally passed through align_to_int64 when the slot itself is
 // sizeof(int64_t) wide. slot_idx must be a valid slot index (enforced with a CHECK).
 size_t ColSlotContext::getColOnlyOffInBytes(const size_t slot_idx) const {
   CHECK_LT(slot_idx, slot_sizes_.size());
   const auto preceding_bytes = getAlignedPaddedSizeForRange(slot_idx);
   const bool is_int64_wide = slot_sizes_[slot_idx].padded_size == sizeof(int64_t);
   return is_int64_wide ? align_to_int64(preceding_bytes) : preceding_bytes;
 }


 // True when no slots have been added.
 bool ColSlotContext::empty() {
   return slot_sizes_.size() == 0;
 }


 void ColSlotContext::clear() {

   slot_sizes_.clear();

   col_to_slot_map_.clear();

 }


 // Grows padded slot sizes in place so that every sizeof(int64_t)-wide slot starts at
 // an offset produced by align_to_int64.
 //
 // Walks the slots while tracking the running byte offset. Whenever an 8-byte slot
 // would start at an unaligned offset, the missing bytes are added to the padded size
 // of the slot immediately before it. Unless sort_on_gpu is set, the last slot is also
 // padded so that the total size is aligned. The padding is CHECKed to be 0 or 4
 // bytes in every case.
 //
 // sort_on_gpu: when true, the trailing padding of the last slot is skipped.
 void ColSlotContext::alignPaddedSlots(const bool sort_on_gpu) {
   if (slot_sizes_.empty()) {
     // Nothing to align. This also keeps the trailing-padding step below from calling
     // back() on an empty vector, which is undefined behaviour.
     return;
   }
   size_t total_bytes{0};
   for (size_t slot_idx = 0; slot_idx < slot_sizes_.size(); slot_idx++) {
     // Read the current width before the previous slot is possibly widened below.
     auto chosen_bytes = slot_sizes_[slot_idx].padded_size;
     if (chosen_bytes == sizeof(int64_t)) {
       const auto aligned_total_bytes = align_to_int64(total_bytes);
       CHECK_GE(aligned_total_bytes, total_bytes);
       if (slot_idx >= 1) {
         // Push the gap into the preceding slot; the first slot has no predecessor
         // and its starting offset of 0 needs no padding.
         const auto padding = aligned_total_bytes - total_bytes;
         CHECK(padding == 0 || padding == 4);
         slot_sizes_[slot_idx - 1].padded_size += padding;
       }
       total_bytes = aligned_total_bytes;
     }
     total_bytes += chosen_bytes;
   }
   if (!sort_on_gpu) {
     // Round the whole row up by widening the final slot.
     const auto aligned_total_bytes = align_to_int64(total_bytes);
     CHECK_GE(aligned_total_bytes, total_bytes);
     const auto padding = aligned_total_bytes - total_bytes;
     CHECK(padding == 0 || padding == 4);
     slot_sizes_.back().padded_size += padding;
   }
 }


 // Appends a new column and one slot per entry of slots_for_col.
 // For each tuple, element 0 is used as the slot's logical size and element 1 as its
 // padded size.
 void ColSlotContext::addColumn(
     const std::vector<std::tuple<int8_t, int8_t>>& slots_for_col) {
   const auto new_col_idx = col_to_slot_map_.size();
   col_to_slot_map_.emplace_back();
   for (size_t i = 0; i < slots_for_col.size(); ++i) {
     const auto& slot_spec = slots_for_col[i];
     const int8_t logical_size = std::get<0>(slot_spec);
     const int8_t padded_size = std::get<1>(slot_spec);
     addSlotForColumn(padded_size, logical_size, new_col_idx);
   }
 }


 // Appends a new column backed by a FlatBuffer of flatbuffer_size bytes. The column
 // gets a single slot with zero padded and zero logical size, which is what
 // checkSlotUsesFlatBufferFormat looks for.
 void ColSlotContext::addColumnFlatBuffer(const int64_t flatbuffer_size) {
   const auto new_col_idx = col_to_slot_map_.size();
   col_to_slot_map_.emplace_back();
   addSlotForColumn(0, 0, new_col_idx);
   // reusing varlenOutput infrastructure for storing the size of a flatbuffer:
   // note that the entry is keyed by the column index here, and that insert() keeps
   // any entry already present under that key.
   const auto size_entry = std::make_pair(new_col_idx, flatbuffer_size);
   varlen_output_slot_map_.insert(size_entry);
 }


 // Returns the FlatBuffer size stored for slot_idx.
 // Throws std::runtime_error when no entry exists for that index.
 int64_t ColSlotContext::getFlatBufferSize(const size_t slot_idx) const {
   const auto size_entry = varlen_output_slot_map_.find(slot_idx);
   if (size_entry != varlen_output_slot_map_.end()) {
     return size_entry->second;
   }
   throw std::runtime_error("Failed to find FlatBuffer map entry for slot " +
                            std::to_string(slot_idx));
 }


 bool ColSlotContext::checkSlotUsesFlatBufferFormat(const size_t slot_idx) const {

   const auto varlen_map_it = varlen_output_slot_map_.find(slot_idx);

   if (varlen_map_it != varlen_output_slot_map_.end() &&

       slot_idx < col_to_slot_map_.size() && col_to_slot_map_[slot_idx].size() == 1) {

     const auto& slot_size = slot_sizes_[col_to_slot_map_[slot_idx][0]];

     return slot_size.padded_size == 0 &&

            slot_size.logical_size == 0;  // as per addColumnFlatBuffer

   }

   return false;

 }


 // Adds a slot of the given logical size to column column_idx, leaving its padded
 // size at -1, which setAllUnsetSlotsPaddedSize treats as "not yet set".
 void ColSlotContext::addSlotForColumn(const int8_t logical_size,
                                       const size_t column_idx) {
   const int8_t unset_padded_size = -1;
   addSlotForColumn(unset_padded_size, logical_size, column_idx);
 }


 // Appends a new slot with the given padded and logical sizes and records its index
 // under column column_idx. column_idx must refer to an existing column (enforced
 // with a CHECK).
 void ColSlotContext::addSlotForColumn(const int8_t padded_size,
                                       const int8_t logical_size,
                                       const size_t column_idx) {
   CHECK_LT(column_idx, col_to_slot_map_.size());
   // The new slot's index is the current slot count, captured before appending.
   const size_t new_slot_idx = slot_sizes_.size();
   col_to_slot_map_[column_idx].push_back(new_slot_idx);
   slot_sizes_.push_back(SlotSize{padded_size, logical_size});
 }


 // Returns the varlen output element size recorded for slot_idx.
 // Throws std::runtime_error when no entry exists for that slot.
 int64_t ColSlotContext::varlenOutputElementSize(const size_t slot_idx) const {
   const auto size_entry = varlen_output_slot_map_.find(slot_idx);
   if (size_entry != varlen_output_slot_map_.end()) {
     return size_entry->second;
   }
   throw std::runtime_error("Failed to find varlen map entry for slot " +
                            std::to_string(slot_idx));
 }

Analyzer.h
Defines data structures for the semantic analysis phase of query processing.

ColSlotContext::getMinPaddedByteSize
int8_t getMinPaddedByteSize(const int8_t actual_min_byte_width) const
Definition: ColSlotContext.cpp:181

CHECK_EQ
#define CHECK_EQ(x, y)
Definition: Logger.h:301

kENCODING_NONE
Definition: sqltypes.h:241

ColSlotContext::alignPaddedSlots
void alignPaddedSlots(const bool sort_on_gpu)
Definition: ColSlotContext.cpp:234

ColSlotContext::ColSlotContext
ColSlotContext()
Definition: ColSlotContext.h:48

kENCODING_GEOINT
Definition: sqltypes.h:247

SqlTypesLayout.h

sort_on_gpu
void sort_on_gpu(int64_t *val_buff, int32_t *idx_buff, const uint64_t entry_count, const bool desc, const uint32_t chosen_bytes, ThrustAllocator &alloc, const int device_id)
Definition: InPlaceSortImpl.cu:94

ColSlotContext::varlen_output_slot_map_
std::unordered_map< SlotIndex, ArraySize > varlen_output_slot_map_
Definition: ColSlotContext.h:161

SlotSize
Definition: ColSlotContext.h:33

CHECK_GE
#define CHECK_GE(x, y)
Definition: Logger.h:306

ColSlotContext::getAllSlotsPaddedSize
size_t getAllSlotsPaddedSize() const
Definition: ColSlotContext.cpp:138

ColSlotContext::getAllSlotsAlignedPaddedSize
size_t getAllSlotsAlignedPaddedSize() const
Definition: ColSlotContext.cpp:148

ColSlotContext::col_to_slot_map_
std::vector< std::vector< size_t > > col_to_slot_map_
Definition: ColSlotContext.h:157

ColSlotContext::slot_sizes_
std::vector< SlotSize > slot_sizes_
Definition: ColSlotContext.h:156

CHECK_GT
#define CHECK_GT(x, y)
Definition: Logger.h:305

ColSlotContext::setAllSlotsSize
void setAllSlotsSize(const int8_t slot_width_size)
Definition: ColSlotContext.cpp:99

get_target_info
TargetInfo get_target_info(const Analyzer::Expr *target_expr, const bool bigint_count)
Definition: TargetInfo.h:92

to_string
std::string to_string(char const *&&v)
Definition: StringTransform.cpp:128

ColSlotContext::getColOnlyOffInBytes
size_t getColOnlyOffInBytes(const size_t slot_idx) const
Definition: ColSlotContext.cpp:216

get_compact_type
const SQLTypeInfo get_compact_type(const TargetInfo &target)
Definition: SqlTypesLayout.h:37

get_bit_width
size_t get_bit_width(const SQLTypeInfo &ti)
Definition: SqlTypesLayout.h:175

gpu_enabled::fill
DEVICE void fill(ARGS &&...args)
Definition: gpu_enabled.h:60

ColSlotContext::addColumnFlatBuffer
void addColumnFlatBuffer(const int64_t flatbuffer_size)
Definition: ColSlotContext.cpp:268

ColSlotContext::getCompactByteWidth
size_t getCompactByteWidth() const
Definition: ColSlotContext.cpp:192

ColSlotContext.h
Provides column info and slot info for the output buffer and some metadata helpers.

ColSlotContext::getAlignedPaddedSizeForRange
size_t getAlignedPaddedSizeForRange(const size_t end) const
Definition: ColSlotContext.cpp:152

g_bigint_count
bool g_bigint_count
Definition: GroupByAndAggregate.cpp:54

gpu_enabled::accumulate
DEVICE auto accumulate(ARGS &&...args)
Definition: gpu_enabled.h:42

ColSlotContext::validate
void validate() const
Definition: ColSlotContext.cpp:124

ColSlotContext::varlenOutputElementSize
int64_t varlenOutputElementSize(const size_t slot_idx) const
Definition: ColSlotContext.cpp:309

ColSlotContext::addColumn
void addColumn(const std::vector< std::tuple< int8_t, int8_t >> &slots_for_col)
Definition: ColSlotContext.cpp:259

CHECK_LT
#define CHECK_LT(x, y)
Definition: Logger.h:303

CHECK_LE
#define CHECK_LE(x, y)
Definition: Logger.h:304

ColSlotContext::setAllSlotsPaddedSize
void setAllSlotsPaddedSize(const int8_t padded_size)
Definition: ColSlotContext.cpp:104

ColSlotContext::checkSlotUsesFlatBufferFormat
bool checkSlotUsesFlatBufferFormat(const size_t slot_idx) const
Definition: ColSlotContext.cpp:285

ColSlotContext::getTotalBytesOfColumnarBuffers
size_t getTotalBytesOfColumnarBuffers(const size_t entry_count) const
Definition: ColSlotContext.cpp:168

ColSlotContext::addSlotForColumn
void addSlotForColumn(const int8_t logical_size, const size_t column_idx)
Definition: ColSlotContext.cpp:296

ColSlotContext::clear
void clear()
Definition: ColSlotContext.cpp:229

ColSlotContext::getSlotCount
size_t getSlotCount() const
Definition: ColSlotContext.cpp:134

ColSlotContext::setAllSlotsPaddedSizeToLogicalSize
void setAllSlotsPaddedSizeToLogicalSize()
Definition: ColSlotContext.cpp:118

CHECK
#define CHECK(condition)
Definition: Logger.h:291

ColSlotContext::getColCount
size_t getColCount() const
Definition: ColSlotContext.cpp:131

ColSlotContext::setAllUnsetSlotsPaddedSize
void setAllUnsetSlotsPaddedSize(const int8_t padded_size)
Definition: ColSlotContext.cpp:110

kAVG
Definition: sqldefs.h:77

ColSlotContext::getFlatBufferSize
int64_t getFlatBufferSize(const size_t slot_idx) const
Definition: ColSlotContext.cpp:276

align_to_int64
FORCE_INLINE HOST DEVICE T align_to_int64(T addr)
Definition: BufferCompaction.h:42

ColSlotContext::empty
bool empty()
Definition: ColSlotContext.cpp:225

kPOINT
Definition: sqltypes.h:84