OmniSciDB  c0231cc57d
 All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Friends Macros Groups Pages
anonymous_namespace{OverlapsJoinHashTable.cpp} Namespace Reference

Classes

struct  HashTableProps
 
struct  TuningState
 
class  BucketSizeTuner
 

Functions

std::vector< double > correct_uninitialized_bucket_sizes_to_thresholds (const std::vector< double > &bucket_sizes, const std::vector< double > &bucket_thresholds, const double initial_value)
 
std::vector< double > compute_bucket_sizes (const std::vector< double > &bucket_thresholds, const Data_Namespace::MemoryLevel effective_memory_level, const JoinColumn &join_column, const JoinColumnTypeInfo &join_column_type, const std::vector< InnerOuter > &inner_outer_pairs, const Executor *executor)
 
std::ostream & operator<< (std::ostream &os, const HashTableProps &props)
 
std::ostream & operator<< (std::ostream &os, const BucketSizeTuner &tuner)
 

Function Documentation

std::vector<double> anonymous_namespace{OverlapsJoinHashTable.cpp}::compute_bucket_sizes ( const std::vector< double > &  bucket_thresholds,
const Data_Namespace::MemoryLevel  effective_memory_level,
const JoinColumn &  join_column,
const JoinColumnTypeInfo &  join_column_type,
const std::vector< InnerOuter > &  inner_outer_pairs,
const Executor *  executor 
)

Definition at line 163 of file OverlapsJoinHashTable.cpp.

References CHECK, CHECK_EQ, compute_bucket_sizes_on_cpu(), compute_bucket_sizes_on_device(), CudaAllocator::copyFromDevice(), correct_uninitialized_bucket_sizes_to_thresholds(), Data_Namespace::CPU_LEVEL, cpu_threads(), getQueryEngineCudaStreamForDevice(), to_string(), transfer_flat_object_to_gpu(), transfer_vector_of_flat_objects_to_gpu(), and VLOG.

Referenced by anonymous_namespace{OverlapsJoinHashTable.cpp}::BucketSizeTuner::computeBucketSizes().

169  {
170  // No coalesced keys for overlaps joins yet
171  CHECK_EQ(inner_outer_pairs.size(), 1u);
172 
173  const auto col = inner_outer_pairs[0].first;
174  CHECK(col);
175  const auto col_ti = col->get_type_info();
176  CHECK(col_ti.is_array());
177 
178  // TODO: Compute the number of dimensions for this overlaps key
179  const size_t num_dims{2};
180  const double initial_bin_value{0.0};
181  std::vector<double> bucket_sizes(num_dims, initial_bin_value);
182  CHECK_EQ(bucket_thresholds.size(), num_dims);
183 
184  VLOG(1)
185  << "Computing x and y bucket sizes for overlaps hash join with maximum bucket size "
186  << std::to_string(bucket_thresholds[0]) << ", "
187  << std::to_string(bucket_thresholds[1]);
188 
189  if (effective_memory_level == Data_Namespace::MemoryLevel::CPU_LEVEL) {
190  const int thread_count = cpu_threads();
191  compute_bucket_sizes_on_cpu(
192  bucket_sizes, join_column, join_column_type, bucket_thresholds, thread_count);
193  }
194 #ifdef HAVE_CUDA
195  else {
196  // Note that we compute the bucket sizes using only a single GPU
197  const int device_id = 0;
198  auto data_mgr = executor->getDataMgr();
199  CudaAllocator allocator(
200  data_mgr, device_id, getQueryEngineCudaStreamForDevice(device_id));
201  auto device_bucket_sizes_gpu =
202  transfer_vector_of_flat_objects_to_gpu(bucket_sizes, allocator);
203  auto join_column_gpu = transfer_flat_object_to_gpu(join_column, allocator);
204  auto join_column_type_gpu = transfer_flat_object_to_gpu(join_column_type, allocator);
205  auto device_bucket_thresholds_gpu =
206  transfer_vector_of_flat_objects_to_gpu(bucket_thresholds, allocator);
207 
208  compute_bucket_sizes_on_device(device_bucket_sizes_gpu,
209  join_column_gpu,
210  join_column_type_gpu,
211  device_bucket_thresholds_gpu);
212  allocator.copyFromDevice(reinterpret_cast<int8_t*>(bucket_sizes.data()),
213  reinterpret_cast<int8_t*>(device_bucket_sizes_gpu),
214  bucket_sizes.size() * sizeof(double));
215  }
216 #endif
217  const auto corrected_bucket_sizes = correct_uninitialized_bucket_sizes_to_thresholds(
218  bucket_sizes, bucket_thresholds, initial_bin_value);
219 
220  VLOG(1) << "Computed x and y bucket sizes for overlaps hash join: ("
221  << corrected_bucket_sizes[0] << ", " << corrected_bucket_sizes[1] << ")";
222 
223  return corrected_bucket_sizes;
224 }
#define CHECK_EQ(x, y)
Definition: Logger.h:230
T * transfer_flat_object_to_gpu(const T &object, DeviceAllocator &allocator)
std::string to_string(char const *&&v)
void compute_bucket_sizes_on_device(double *bucket_sizes_buffer, const JoinColumn *join_column, const JoinColumnTypeInfo *type_info, const double *bucket_size_thresholds)
void compute_bucket_sizes_on_cpu(std::vector< double > &bucket_sizes_for_dimension, const JoinColumn &join_column, const JoinColumnTypeInfo &type_info, const std::vector< double > &bucket_size_thresholds, const int thread_count)
CUstream getQueryEngineCudaStreamForDevice(int device_num)
Definition: QueryEngine.cpp:7
std::vector< double > correct_uninitialized_bucket_sizes_to_thresholds(const std::vector< double > &bucket_sizes, const std::vector< double > &bucket_thresholds, const double initial_value)
#define CHECK(condition)
Definition: Logger.h:222
T * transfer_vector_of_flat_objects_to_gpu(const std::vector< T > &vec, DeviceAllocator &allocator)
int cpu_threads()
Definition: thread_count.h:25
#define VLOG(n)
Definition: Logger.h:316

+ Here is the call graph for this function:

+ Here is the caller graph for this function:

std::vector<double> anonymous_namespace{OverlapsJoinHashTable.cpp}::correct_uninitialized_bucket_sizes_to_thresholds ( const std::vector< double > &  bucket_sizes,
const std::vector< double > &  bucket_thresholds,
const double  initial_value 
)

Definition at line 150 of file OverlapsJoinHashTable.cpp.

Referenced by compute_bucket_sizes().

153  {
154  std::vector<double> corrected_bucket_sizes(bucket_sizes);
155  for (size_t i = 0; i != bucket_sizes.size(); ++i) {
156  if (bucket_sizes[i] == initial_value) {
157  corrected_bucket_sizes[i] = bucket_thresholds[i];
158  }
159  }
160  return corrected_bucket_sizes;
161 }

+ Here is the caller graph for this function:

std::ostream& anonymous_namespace{OverlapsJoinHashTable.cpp}::operator<< ( std::ostream &  os,
const HashTableProps &  props 
)

Definition at line 247 of file OverlapsJoinHashTable.cpp.

References anonymous_namespace{OverlapsJoinHashTable.cpp}::HashTableProps::emitted_keys_count, anonymous_namespace{OverlapsJoinHashTable.cpp}::HashTableProps::entry_count, anonymous_namespace{OverlapsJoinHashTable.cpp}::HashTableProps::hash_table_size, and anonymous_namespace{OverlapsJoinHashTable.cpp}::HashTableProps::keys_per_bin.

247  {
248  os << " entry_count: " << props.entry_count << ", emitted_keys "
249  << props.emitted_keys_count << ", hash table size " << props.hash_table_size
250  << ", keys per bin " << props.keys_per_bin;
251  return os;
252 }
std::ostream& anonymous_namespace{OverlapsJoinHashTable.cpp}::operator<< ( std::ostream &  os,
const BucketSizeTuner &  tuner 
)

Definition at line 525 of file OverlapsJoinHashTable.cpp.

References anonymous_namespace{OverlapsJoinHashTable.cpp}::BucketSizeTuner::bucket_thresholds_, anonymous_namespace{OverlapsJoinHashTable.cpp}::BucketSizeTuner::min_threshold_, anonymous_namespace{OverlapsJoinHashTable.cpp}::BucketSizeTuner::num_steps_, and anonymous_namespace{OverlapsJoinHashTable.cpp}::BucketSizeTuner::step_.

525  {
526  os << "Step Num: " << tuner.num_steps_ << ", Threshold: " << std::fixed << "("
527  << tuner.bucket_thresholds_[0] << ", " << tuner.bucket_thresholds_[1] << ")"
528  << ", Step Size: " << std::fixed << tuner.step_ << ", Min: " << std::fixed
529  << tuner.min_threshold_;
530  return os;
531 }