OmniSciDB  fe05a0c208
 All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Friends Macros Pages
QueryMemoryInitializer.cpp File Reference
#include "QueryMemoryInitializer.h"
#include "Execute.h"
#include "GpuInitGroups.h"
#include "GpuMemUtils.h"
#include "Logger/Logger.h"
#include "OutputBufferInitialization.h"
#include "ResultSet.h"
#include "StreamingTopN.h"
#include <Shared/checked_alloc.h>
+ Include dependency graph for QueryMemoryInitializer.cpp:

Go to the source code of this file.

Namespaces

 anonymous_namespace{QueryMemoryInitializer.cpp}
 

Functions

void anonymous_namespace{QueryMemoryInitializer.cpp}::check_total_bitmap_memory (const QueryMemoryDescriptor &query_mem_desc)
 
int64_t * anonymous_namespace{QueryMemoryInitializer.cpp}::alloc_group_by_buffer (const size_t numBytes, RenderAllocatorMap *render_allocator_map, const size_t thread_idx, RowSetMemoryOwner *mem_owner)
 
int64_t anonymous_namespace{QueryMemoryInitializer.cpp}::get_consistent_frag_size (const std::vector< uint64_t > &frag_offsets)
 
std::vector< int64_t > anonymous_namespace{QueryMemoryInitializer.cpp}::get_consistent_frags_sizes (const std::vector< std::vector< uint64_t >> &frag_offsets)
 
std::vector< int64_t > anonymous_namespace{QueryMemoryInitializer.cpp}::get_consistent_frags_sizes (const std::vector< Analyzer::Expr * > &target_exprs, const std::vector< int64_t > &table_frag_sizes)
 
std::vector< std::vector< int64_t > > anonymous_namespace{QueryMemoryInitializer.cpp}::get_col_frag_offsets (const std::vector< Analyzer::Expr * > &target_exprs, const std::vector< std::vector< uint64_t >> &table_frag_offsets)
 
 num_buffers_ (1)
 
 count_distinct_bitmap_mem_ (0)
 
 count_distinct_bitmap_mem_bytes_ (0)
 
 count_distinct_bitmap_crt_ptr_ (nullptr)
 
 count_distinct_bitmap_host_mem_ (nullptr)
 
 device_allocator_ (device_allocator)
 
 thread_idx_ (0)
 
template<typename T >
int8_t * anonymous_namespace{QueryMemoryInitializer.cpp}::initColumnarBuffer (T *buffer_ptr, const T init_val, const uint32_t entry_count)
 
void anonymous_namespace{QueryMemoryInitializer.cpp}::compact_projection_buffer_for_cpu_columnar (const QueryMemoryDescriptor &query_mem_desc, int8_t *projection_buffer, const size_t projection_count)
 

Variables

int64_t g_bitmap_memory_limit {8LL * 1000 * 1000 * 1000}
 
 query_mem_desc
 

Function Documentation

count_distinct_bitmap_crt_ptr_ ( nullptr  )
count_distinct_bitmap_host_mem_ ( nullptr  )
count_distinct_bitmap_mem_ ( )
count_distinct_bitmap_mem_bytes_ ( )
device_allocator_ ( device_allocator  )
num_buffers_ ( )

Referenced by thread_idx_().

+ Here is the caller graph for this function:

thread_idx_ ( )

Definition at line 327 of file QueryMemoryInitializer.cpp.

References anonymous_namespace{QueryMemoryInitializer.cpp}::alloc_group_by_buffer(), CHECK_EQ, CHECK_GE, anonymous_namespace{QueryMemoryInitializer.cpp}::get_col_frag_offsets(), anonymous_namespace{QueryMemoryInitializer.cpp}::get_consistent_frags_sizes(), GPU, num_buffers_(), query_mem_desc, and target_exprs_to_infos().

327  {
328  // Table functions output columnar, basically treat this as a projection
329  const auto& consistent_frag_sizes = get_consistent_frags_sizes(frag_offsets);
330  if (consistent_frag_sizes.empty()) {
331  // No fragments in the input, no underlying buffers will be needed.
332  return;
333  }
334 
335  size_t group_buffer_size{0};
336  const size_t num_columns = query_mem_desc.getBufferColSlotCount();
337  group_buffer_size = num_rows_ * num_columns * sizeof(int64_t);
338  CHECK_GE(group_buffer_size, size_t(0));
339 
340  const auto index_buffer_qw =
341  device_type == ExecutorDeviceType::GPU && query_mem_desc.hasKeylessHash()
342  ? query_mem_desc.getEntryCount()
343  : size_t(0);
344  const auto actual_group_buffer_size =
345  group_buffer_size + index_buffer_qw * sizeof(int64_t);
346  CHECK_GE(actual_group_buffer_size, group_buffer_size);
347 
348  CHECK_EQ(num_buffers_, size_t(1));
349  auto group_by_buffer = alloc_group_by_buffer(
350  actual_group_buffer_size, nullptr, thread_idx_, row_set_mem_owner.get());
351  if (!query_mem_desc.lazyInitGroups(device_type)) {
352  initColumnarGroups(
353  query_mem_desc, group_by_buffer + index_buffer_qw, init_agg_vals_, executor);
354  }
355  group_by_buffers_.push_back(group_by_buffer);
356 
357  const auto column_frag_offsets =
358  get_col_frag_offsets(exe_unit.target_exprs, frag_offsets);
359  const auto column_frag_sizes =
360  get_consistent_frags_sizes(exe_unit.target_exprs, consistent_frag_sizes);
361  result_sets_.emplace_back(
362  new ResultSet(target_exprs_to_infos(exe_unit.target_exprs, query_mem_desc),
363  {},
364  col_buffers,
365  column_frag_offsets,
366  column_frag_sizes,
367  device_type,
368  device_id,
369  ResultSet::fixupQueryMemoryDescriptor(query_mem_desc),
370  row_set_mem_owner_,
371  executor->getCatalog(),
372  executor->blockSize(),
373  executor->gridSize()));
374  result_sets_.back()->allocateStorage(reinterpret_cast<int8_t*>(group_by_buffer),
375  init_agg_vals_);
376 }
#define CHECK_EQ(x, y)
Definition: Logger.h:211
#define CHECK_GE(x, y)
Definition: Logger.h:216
num_buffers_(1)
std::vector< int64_t > get_consistent_frags_sizes(const std::vector< std::vector< uint64_t >> &frag_offsets)
static QueryMemoryDescriptor fixupQueryMemoryDescriptor(const QueryMemoryDescriptor &)
Definition: ResultSet.cpp:486
std::vector< TargetInfo > target_exprs_to_infos(const std::vector< Analyzer::Expr * > &targets, const QueryMemoryDescriptor &query_mem_desc)
int64_t * alloc_group_by_buffer(const size_t numBytes, RenderAllocatorMap *render_allocator_map, const size_t thread_idx, RowSetMemoryOwner *mem_owner)
std::vector< std::vector< int64_t > > get_col_frag_offsets(const std::vector< Analyzer::Expr * > &target_exprs, const std::vector< std::vector< uint64_t >> &table_frag_offsets)

+ Here is the call graph for this function:

Variable Documentation

int64_t g_bitmap_memory_limit {8LL * 1000 * 1000 * 1000}