OmniSciDB  c1a53651b2
 All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Friends Macros Groups Pages
anonymous_namespace{OverlapsJoinHashTable.cpp} Namespace Reference

Classes

struct  HashTableProps
 
struct  TuningState
 
class  BucketSizeTuner
 

Functions

std::vector< double > correct_uninitialized_bucket_sizes_to_thresholds (const std::vector< double > &bucket_sizes, const std::vector< double > &bucket_thresholds, const double initial_value)
 
std::vector< double > compute_bucket_sizes (const std::vector< double > &bucket_thresholds, const Data_Namespace::MemoryLevel effective_memory_level, const JoinColumn &join_column, const JoinColumnTypeInfo &join_column_type, const std::vector< InnerOuter > &inner_outer_pairs, const Executor *executor)
 
std::ostream & operator<< (std::ostream &os, const HashTableProps &props)
 
std::ostream & operator<< (std::ostream &os, const BucketSizeTuner &tuner)
 

Function Documentation

std::vector<double> anonymous_namespace{OverlapsJoinHashTable.cpp}::compute_bucket_sizes ( const std::vector< double > &  bucket_thresholds,
const Data_Namespace::MemoryLevel  effective_memory_level,
const JoinColumn &  join_column,
const JoinColumnTypeInfo &  join_column_type,
const std::vector< InnerOuter > &  inner_outer_pairs,
const Executor *  executor 
)

Definition at line 162 of file OverlapsJoinHashTable.cpp.

References CHECK, CHECK_EQ, compute_bucket_sizes_on_cpu(), compute_bucket_sizes_on_device(), CudaAllocator::copyFromDevice(), correct_uninitialized_bucket_sizes_to_thresholds(), Data_Namespace::CPU_LEVEL, cpu_threads(), getQueryEngineCudaStreamForDevice(), to_string(), transfer_flat_object_to_gpu(), transfer_vector_of_flat_objects_to_gpu(), and VLOG.

Referenced by anonymous_namespace{OverlapsJoinHashTable.cpp}::BucketSizeTuner::computeBucketSizes().

168  {
169  // No coalesced keys for overlaps joins yet
170  CHECK_EQ(inner_outer_pairs.size(), 1u);
171 
172  const auto col = inner_outer_pairs[0].first;
173  CHECK(col);
174  const auto col_ti = col->get_type_info();
175  CHECK(col_ti.is_array());
176 
177  // TODO: Compute the number of dimensions for this overlaps key
178  const size_t num_dims{2};
179  const double initial_bin_value{0.0};
180  std::vector<double> bucket_sizes(num_dims, initial_bin_value);
181  CHECK_EQ(bucket_thresholds.size(), num_dims);
182 
183  VLOG(1)
184  << "Computing x and y bucket sizes for overlaps hash join with maximum bucket size "
185  << std::to_string(bucket_thresholds[0]) << ", "
186  << std::to_string(bucket_thresholds[1]);
187 
188  if (effective_memory_level == Data_Namespace::MemoryLevel::CPU_LEVEL) {
189  const int thread_count = cpu_threads();
190  compute_bucket_sizes_on_cpu(
191  bucket_sizes, join_column, join_column_type, bucket_thresholds, thread_count);
192  }
193 #ifdef HAVE_CUDA
194  else {
195  // Note that we compute the bucket sizes using only a single GPU
196  const int device_id = 0;
197  auto data_mgr = executor->getDataMgr();
198  CudaAllocator allocator(
199  data_mgr, device_id, getQueryEngineCudaStreamForDevice(device_id));
200  auto device_bucket_sizes_gpu =
201  transfer_vector_of_flat_objects_to_gpu(bucket_sizes, allocator);
202  auto join_column_gpu = transfer_flat_object_to_gpu(join_column, allocator);
203  auto join_column_type_gpu = transfer_flat_object_to_gpu(join_column_type, allocator);
204  auto device_bucket_thresholds_gpu =
205  transfer_vector_of_flat_objects_to_gpu(bucket_thresholds, allocator);
206 
207  compute_bucket_sizes_on_device(device_bucket_sizes_gpu,
208  join_column_gpu,
209  join_column_type_gpu,
210  device_bucket_thresholds_gpu);
211  allocator.copyFromDevice(reinterpret_cast<int8_t*>(bucket_sizes.data()),
212  reinterpret_cast<int8_t*>(device_bucket_sizes_gpu),
213  bucket_sizes.size() * sizeof(double));
214  }
215 #endif
216  const auto corrected_bucket_sizes = correct_uninitialized_bucket_sizes_to_thresholds(
217  bucket_sizes, bucket_thresholds, initial_bin_value);
218 
219  VLOG(1) << "Computed x and y bucket sizes for overlaps hash join: ("
220  << corrected_bucket_sizes[0] << ", " << corrected_bucket_sizes[1] << ")";
221 
222  return corrected_bucket_sizes;
223 }
#define CHECK_EQ(x, y)
Definition: Logger.h:301
T * transfer_flat_object_to_gpu(const T &object, DeviceAllocator &allocator)
std::string to_string(char const *&&v)
void compute_bucket_sizes_on_device(double *bucket_sizes_buffer, const JoinColumn *join_column, const JoinColumnTypeInfo *type_info, const double *bucket_size_thresholds)
void compute_bucket_sizes_on_cpu(std::vector< double > &bucket_sizes_for_dimension, const JoinColumn &join_column, const JoinColumnTypeInfo &type_info, const std::vector< double > &bucket_size_thresholds, const int thread_count)
CUstream getQueryEngineCudaStreamForDevice(int device_num)
Definition: QueryEngine.cpp:7
std::vector< double > correct_uninitialized_bucket_sizes_to_thresholds(const std::vector< double > &bucket_sizes, const std::vector< double > &bucket_thresholds, const double initial_value)
#define CHECK(condition)
Definition: Logger.h:291
T * transfer_vector_of_flat_objects_to_gpu(const std::vector< T > &vec, DeviceAllocator &allocator)
int cpu_threads()
Definition: thread_count.h:25
#define VLOG(n)
Definition: Logger.h:387

+ Here is the call graph for this function:

+ Here is the caller graph for this function:

std::vector<double> anonymous_namespace{OverlapsJoinHashTable.cpp}::correct_uninitialized_bucket_sizes_to_thresholds ( const std::vector< double > &  bucket_sizes,
const std::vector< double > &  bucket_thresholds,
const double  initial_value 
)

Definition at line 149 of file OverlapsJoinHashTable.cpp.

Referenced by compute_bucket_sizes().

152  {
153  std::vector<double> corrected_bucket_sizes(bucket_sizes);
154  for (size_t i = 0; i != bucket_sizes.size(); ++i) {
155  if (bucket_sizes[i] == initial_value) {
156  corrected_bucket_sizes[i] = bucket_thresholds[i];
157  }
158  }
159  return corrected_bucket_sizes;
160 }

+ Here is the caller graph for this function:

std::ostream& anonymous_namespace{OverlapsJoinHashTable.cpp}::operator<< ( std::ostream &  os,
const HashTableProps &  props 
)

Definition at line 246 of file OverlapsJoinHashTable.cpp.

References anonymous_namespace{OverlapsJoinHashTable.cpp}::HashTableProps::emitted_keys_count, anonymous_namespace{OverlapsJoinHashTable.cpp}::HashTableProps::entry_count, anonymous_namespace{OverlapsJoinHashTable.cpp}::HashTableProps::hash_table_size, and anonymous_namespace{OverlapsJoinHashTable.cpp}::HashTableProps::keys_per_bin.

246  {
247  os << " entry_count: " << props.entry_count << ", emitted_keys "
248  << props.emitted_keys_count << ", hash table size " << props.hash_table_size
249  << ", keys per bin " << props.keys_per_bin;
250  return os;
251 }
std::ostream& anonymous_namespace{OverlapsJoinHashTable.cpp}::operator<< ( std::ostream &  os,
const BucketSizeTuner &  tuner 
)

Definition at line 524 of file OverlapsJoinHashTable.cpp.

References anonymous_namespace{OverlapsJoinHashTable.cpp}::BucketSizeTuner::bucket_thresholds_, anonymous_namespace{OverlapsJoinHashTable.cpp}::BucketSizeTuner::min_threshold_, anonymous_namespace{OverlapsJoinHashTable.cpp}::BucketSizeTuner::num_steps_, and anonymous_namespace{OverlapsJoinHashTable.cpp}::BucketSizeTuner::step_.

524  {
525  os << "Step Num: " << tuner.num_steps_ << ", Threshold: " << std::fixed << "("
526  << tuner.bucket_thresholds_[0] << ", " << tuner.bucket_thresholds_[1] << ")"
527  << ", Step Size: " << std::fixed << tuner.step_ << ", Min: " << std::fixed
528  << tuner.min_threshold_;
529  return os;
530 }