OmniSciDB  21ac014ffc
 All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Friends Macros Groups Pages
QueryMemoryInitializer.cpp File Reference
#include "QueryMemoryInitializer.h"
#include "Execute.h"
#include "GpuInitGroups.h"
#include "GpuMemUtils.h"
#include "Logger/Logger.h"
#include "OutputBufferInitialization.h"
#include "ResultSet.h"
#include "StreamingTopN.h"
#include <Shared/checked_alloc.h>
+ Include dependency graph for QueryMemoryInitializer.cpp:

Go to the source code of this file.

Namespaces

 anonymous_namespace{QueryMemoryInitializer.cpp}
 

Functions

void anonymous_namespace{QueryMemoryInitializer.cpp}::check_total_bitmap_memory (const QueryMemoryDescriptor &query_mem_desc)
 
int64_t * anonymous_namespace{QueryMemoryInitializer.cpp}::alloc_group_by_buffer (const size_t numBytes, RenderAllocatorMap *render_allocator_map, const size_t thread_idx, RowSetMemoryOwner *mem_owner)
 
int64_t anonymous_namespace{QueryMemoryInitializer.cpp}::get_consistent_frag_size (const std::vector< uint64_t > &frag_offsets)
 
std::vector< int64_t > anonymous_namespace{QueryMemoryInitializer.cpp}::get_consistent_frags_sizes (const std::vector< std::vector< uint64_t >> &frag_offsets)
 
std::vector< int64_t > anonymous_namespace{QueryMemoryInitializer.cpp}::get_consistent_frags_sizes (const std::vector< Analyzer::Expr * > &target_exprs, const std::vector< int64_t > &table_frag_sizes)
 
std::vector< std::vector< int64_t > > anonymous_namespace{QueryMemoryInitializer.cpp}::get_col_frag_offsets (const std::vector< Analyzer::Expr * > &target_exprs, const std::vector< std::vector< uint64_t >> &table_frag_offsets)
 
 num_buffers_ (1)
 
 varlen_output_buffer_ (0)
 
 varlen_output_buffer_host_ptr_ (nullptr)
 
 count_distinct_bitmap_mem_ (0)
 
 count_distinct_bitmap_mem_bytes_ (0)
 
 count_distinct_bitmap_crt_ptr_ (nullptr)
 
 count_distinct_bitmap_host_mem_ (nullptr)
 
 device_allocator_ (device_allocator)
 
 thread_idx_ (0)
 
template<typename T >
int8_t * anonymous_namespace{QueryMemoryInitializer.cpp}::initColumnarBuffer (T *buffer_ptr, const T init_val, const uint32_t entry_count)
 
void anonymous_namespace{QueryMemoryInitializer.cpp}::compact_projection_buffer_for_cpu_columnar (const QueryMemoryDescriptor &query_mem_desc, int8_t *projection_buffer, const size_t projection_count)
 

Variables

int64_t g_bitmap_memory_limit {8LL * 1000 * 1000 * 1000}
 
 query_mem_desc
 

Function Documentation

count_distinct_bitmap_crt_ptr_ ( nullptr  )
count_distinct_bitmap_host_mem_ ( nullptr  )
count_distinct_bitmap_mem_ ( 0  )
count_distinct_bitmap_mem_bytes_ ( 0  )
device_allocator_ ( device_allocator  )
num_buffers_ ( 1  )

Referenced by thread_idx_().

+ Here is the caller graph for this function:

thread_idx_ ( 0  )

Definition at line 341 of file QueryMemoryInitializer.cpp.

References anonymous_namespace{QueryMemoryInitializer.cpp}::alloc_group_by_buffer(), CHECK_EQ, CHECK_GE, anonymous_namespace{QueryMemoryInitializer.cpp}::get_col_frag_offsets(), anonymous_namespace{QueryMemoryInitializer.cpp}::get_consistent_frags_sizes(), GPU, num_buffers_(), query_mem_desc, and target_exprs_to_infos().

341  {
342  // Table functions output columnar, basically treat this as a projection
343  const auto& consistent_frag_sizes = get_consistent_frags_sizes(frag_offsets);
344  if (consistent_frag_sizes.empty()) {
345  // No fragments in the input, no underlying buffers will be needed.
346  return;
347  }
348 
349  size_t group_buffer_size{0};
350  const size_t num_columns = query_mem_desc.getBufferColSlotCount();
351  group_buffer_size = num_rows_ * num_columns * sizeof(int64_t);
352  CHECK_GE(group_buffer_size, size_t(0));
353 
354  const auto index_buffer_qw =
355  device_type == ExecutorDeviceType::GPU && query_mem_desc.hasKeylessHash()
356  ? query_mem_desc.getEntryCount()
357  : size_t(0);
358  const auto actual_group_buffer_size =
359  group_buffer_size + index_buffer_qw * sizeof(int64_t);
360  CHECK_GE(actual_group_buffer_size, group_buffer_size);
361 
362  CHECK_EQ(num_buffers_, size_t(1));
363  auto group_by_buffer = alloc_group_by_buffer(
364  actual_group_buffer_size, nullptr, thread_idx_, row_set_mem_owner.get());
365  if (!query_mem_desc.lazyInitGroups(device_type)) {
366  initColumnarGroups(
367  query_mem_desc, group_by_buffer + index_buffer_qw, init_agg_vals_, executor);
368  }
369  group_by_buffers_.push_back(group_by_buffer);
370 
371  const auto column_frag_offsets =
372  get_col_frag_offsets(exe_unit.target_exprs, frag_offsets);
373  const auto column_frag_sizes =
374  get_consistent_frags_sizes(exe_unit.target_exprs, consistent_frag_sizes);
375  result_sets_.emplace_back(
376  new ResultSet(target_exprs_to_infos(exe_unit.target_exprs, query_mem_desc),
377  /*col_lazy_fetch_info=*/{},
378  col_buffers,
379  column_frag_offsets,
380  column_frag_sizes,
381  device_type,
382  device_id,
383  ResultSet::fixupQueryMemoryDescriptor(query_mem_desc),
384  row_set_mem_owner_,
385  executor->getCatalog(),
386  executor->blockSize(),
387  executor->gridSize()));
388  result_sets_.back()->allocateStorage(reinterpret_cast<int8_t*>(group_by_buffer),
389  init_agg_vals_);
390 }
#define CHECK_EQ(x, y)
Definition: Logger.h:214
#define CHECK_GE(x, y)
Definition: Logger.h:219
num_buffers_(1)
std::vector< int64_t > get_consistent_frags_sizes(const std::vector< std::vector< uint64_t >> &frag_offsets)
static QueryMemoryDescriptor fixupQueryMemoryDescriptor(const QueryMemoryDescriptor &)
Definition: ResultSet.cpp:491
std::vector< TargetInfo > target_exprs_to_infos(const std::vector< Analyzer::Expr * > &targets, const QueryMemoryDescriptor &query_mem_desc)
int64_t * alloc_group_by_buffer(const size_t numBytes, RenderAllocatorMap *render_allocator_map, const size_t thread_idx, RowSetMemoryOwner *mem_owner)
std::vector< std::vector< int64_t > > get_col_frag_offsets(const std::vector< Analyzer::Expr * > &target_exprs, const std::vector< std::vector< uint64_t >> &table_frag_offsets)

+ Here is the call graph for this function:

varlen_output_buffer_ ( 0  )
varlen_output_buffer_host_ptr_ ( nullptr  )

Variable Documentation

int64_t g_bitmap_memory_limit {8LL * 1000 * 1000 * 1000}