OmniSciDB  c1a53651b2
 All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Friends Macros Groups Pages
anonymous_namespace{OverlapsJoinHashTable.cpp}::BucketSizeTuner Class Reference
+ Collaboration diagram for anonymous_namespace{OverlapsJoinHashTable.cpp}::BucketSizeTuner:

Public Member Functions

 BucketSizeTuner (const double bucket_threshold, const double step, const double min_threshold, const Data_Namespace::MemoryLevel effective_memory_level, const std::vector< ColumnsForDevice > &columns_per_device, const std::vector< InnerOuter > &inner_outer_pairs, const size_t table_tuple_count, const Executor *executor)
 
bool tuneOneStep ()
 
bool tuneOneStep (const TuningState::TuningDirection tuning_direction)
 
bool tuneOneStep (const TuningState::TuningDirection tuning_direction, const double step_overide)
 
auto getMinBucketSize () const
 
std::vector< double > getInverseBucketSizes ()
 

Private Member Functions

bool bucketThresholdsBelowMinThreshold () const
 
std::vector< double > computeBucketSizes () const
 
bool tuneSmallerOneStep (const double step_overide)
 
bool tuneLargerOneStep (const double step_overide)
 

Private Attributes

size_t num_dims_
 
std::vector< double > bucket_thresholds_
 
size_t num_steps_ {0}
 
const double step_
 
const double min_threshold_
 
const Data_Namespace::MemoryLevel effective_memory_level_
 
const std::vector< ColumnsForDevice > & columns_per_device_
 
const std::vector< InnerOuter > & inner_outer_pairs_
 
const size_t table_tuple_count_
 
const Executor * executor_
 
std::vector< double > current_bucket_sizes_
 

Friends

std::ostream & operator<< (std::ostream &os, const BucketSizeTuner &tuner)
 

Detailed Description

Definition at line 379 of file OverlapsJoinHashTable.cpp.

Constructor & Destructor Documentation

anonymous_namespace{OverlapsJoinHashTable.cpp}::BucketSizeTuner::BucketSizeTuner ( const double  bucket_threshold,
const double  step,
const double  min_threshold,
const Data_Namespace::MemoryLevel  effective_memory_level,
const std::vector< ColumnsForDevice > &  columns_per_device,
const std::vector< InnerOuter > &  inner_outer_pairs,
const size_t  table_tuple_count,
const Executor *  executor 
)
inline

Definition at line 381 of file OverlapsJoinHashTable.cpp.

References CHECK.

389  : num_dims_(2) // Todo: allow varying number of dims
390  , bucket_thresholds_(/*count=*/num_dims_, /*value=*/bucket_threshold)
391  , step_(step)
392  , min_threshold_(min_threshold)
393  , effective_memory_level_(effective_memory_level)
394  , columns_per_device_(columns_per_device)
395  , inner_outer_pairs_(inner_outer_pairs)
396  , table_tuple_count_(table_tuple_count)
397  , executor_(executor) {
398  CHECK(!columns_per_device_.empty());
399  }
#define CHECK(condition)
Definition: Logger.h:291

Member Function Documentation

bool anonymous_namespace{OverlapsJoinHashTable.cpp}::BucketSizeTuner::bucketThresholdsBelowMinThreshold ( ) const
inline, private

Definition at line 442 of file OverlapsJoinHashTable.cpp.

442  {
443  for (const auto& t : bucket_thresholds_) {
444  if (t < min_threshold_) {
445  return true;
446  }
447  }
448  return false;
449  }
std::vector<double> anonymous_namespace{OverlapsJoinHashTable.cpp}::BucketSizeTuner::computeBucketSizes ( ) const
inline, private

Definition at line 451 of file OverlapsJoinHashTable.cpp.

References anonymous_namespace{OverlapsJoinHashTable.cpp}::compute_bucket_sizes(), and executor_().

451  {
452  if (table_tuple_count_ == 0) {
453  return std::vector<double>(/*count=*/num_dims_, /*val=*/0);
454  }
457  columns_per_device_.front().join_columns[0],
458  columns_per_device_.front().join_column_types[0],
460  executor_);
461  }
std::vector< double > compute_bucket_sizes(const std::vector< double > &bucket_thresholds, const Data_Namespace::MemoryLevel effective_memory_level, const JoinColumn &join_column, const JoinColumnTypeInfo &join_column_type, const std::vector< InnerOuter > &inner_outer_pairs, const Executor *executor)

+ Here is the call graph for this function:

std::vector<double> anonymous_namespace{OverlapsJoinHashTable.cpp}::BucketSizeTuner::getInverseBucketSizes ( )
inline

Retrieves the inverted bucket sizes, which is the form used elsewhere in the OverlapsHashTable framework.

Returns
the inverted bucket sizes, i.e. a set of factors (1.0 / bucket size for each current bucket size) that will place a raw value in a bucket when multiplied by the raw value

Definition at line 428 of file OverlapsJoinHashTable.cpp.

References CHECK_EQ.

428  {
429  if (num_steps_ == 0) {
430  CHECK_EQ(current_bucket_sizes_.size(), static_cast<size_t>(0));
432  }
434  std::vector<double> inverse_bucket_sizes;
435  for (const auto s : current_bucket_sizes_) {
436  inverse_bucket_sizes.emplace_back(1.0 / s);
437  }
438  return inverse_bucket_sizes;
439  }
#define CHECK_EQ(x, y)
Definition: Logger.h:301
auto anonymous_namespace{OverlapsJoinHashTable.cpp}::BucketSizeTuner::getMinBucketSize ( ) const
inline

Definition at line 418 of file OverlapsJoinHashTable.cpp.

418  {
419  return *std::min_element(bucket_thresholds_.begin(), bucket_thresholds_.end());
420  }
bool anonymous_namespace{OverlapsJoinHashTable.cpp}::BucketSizeTuner::tuneLargerOneStep ( const double  step_overide)
inline, private

Definition at line 487 of file OverlapsJoinHashTable.cpp.

References CHECK_EQ.

487  {
488  if (!current_bucket_sizes_.empty()) {
491  }
492  // If current_bucket_sizes was empty, we will start from our initial threshold
493  for (auto& t : bucket_thresholds_) {
494  t *= step_overide;
495  }
496  // When tuning up, do not dynamically compute bucket_sizes, as compute_bucket_sizes as
497  // written will pick the largest bin size below the threshold, meaning our bucket_size
498  // will never increase beyond the size of the largest polygon. This could mean that we
499  // can never make the bucket sizes large enough to get our hash table below the
500  // maximum size Possible todo: enable templated version of compute_bucket_sizes that
501  // allows for optionally finding smallest extent above threshold, to mirror default
502  // behavior finding largest extent below threshold, and use former variant here
504  num_steps_++;
505  return true;
506  }
#define CHECK_EQ(x, y)
Definition: Logger.h:301
bool anonymous_namespace{OverlapsJoinHashTable.cpp}::BucketSizeTuner::tuneOneStep ( )
inline

Definition at line 401 of file OverlapsJoinHashTable.cpp.

References tuneOneStep().

Referenced by tuneOneStep().

+ Here is the call graph for this function:

+ Here is the caller graph for this function:

bool anonymous_namespace{OverlapsJoinHashTable.cpp}::BucketSizeTuner::tuneOneStep ( const TuningState::TuningDirection  tuning_direction)
inline
bool anonymous_namespace{OverlapsJoinHashTable.cpp}::BucketSizeTuner::tuneOneStep ( const TuningState::TuningDirection  tuning_direction,
const double  step_overide 
)
inline

Definition at line 407 of file OverlapsJoinHashTable.cpp.

bool anonymous_namespace{OverlapsJoinHashTable.cpp}::BucketSizeTuner::tuneSmallerOneStep ( const double  step_overide)
inline, private

Definition at line 463 of file OverlapsJoinHashTable.cpp.

References CHECK_EQ, and VLOG.

463  {
464  if (!current_bucket_sizes_.empty()) {
467  for (auto& t : bucket_thresholds_) {
468  t /= step_overide;
469  }
470  }
472  VLOG(1) << "Aborting overlaps tuning as at least one bucket size is below min "
473  "threshold";
474  return false;
475  }
476  const auto next_bucket_sizes = computeBucketSizes();
477  if (next_bucket_sizes == current_bucket_sizes_) {
478  VLOG(1) << "Aborting overlaps tuning as bucket size is no longer changing.";
479  return false;
480  }
481 
482  current_bucket_sizes_ = next_bucket_sizes;
483  num_steps_++;
484  return true;
485  }
#define CHECK_EQ(x, y)
Definition: Logger.h:301
#define VLOG(n)
Definition: Logger.h:387

Friends And Related Function Documentation

std::ostream& operator<< ( std::ostream &  os,
const BucketSizeTuner &  tuner 
)
friend

Definition at line 524 of file OverlapsJoinHashTable.cpp.

524  {
525  os << "Step Num: " << tuner.num_steps_ << ", Threshold: " << std::fixed << "("
526  << tuner.bucket_thresholds_[0] << ", " << tuner.bucket_thresholds_[1] << ")"
527  << ", Step Size: " << std::fixed << tuner.step_ << ", Min: " << std::fixed
528  << tuner.min_threshold_;
529  return os;
530 }

Member Data Documentation

std::vector<double> anonymous_namespace{OverlapsJoinHashTable.cpp}::BucketSizeTuner::bucket_thresholds_
private
const std::vector<ColumnsForDevice>& anonymous_namespace{OverlapsJoinHashTable.cpp}::BucketSizeTuner::columns_per_device_
private

Definition at line 514 of file OverlapsJoinHashTable.cpp.

std::vector<double> anonymous_namespace{OverlapsJoinHashTable.cpp}::BucketSizeTuner::current_bucket_sizes_
private

Definition at line 519 of file OverlapsJoinHashTable.cpp.

const Data_Namespace::MemoryLevel anonymous_namespace{OverlapsJoinHashTable.cpp}::BucketSizeTuner::effective_memory_level_
private

Definition at line 513 of file OverlapsJoinHashTable.cpp.

const Executor* anonymous_namespace{OverlapsJoinHashTable.cpp}::BucketSizeTuner::executor_
private

Definition at line 517 of file OverlapsJoinHashTable.cpp.

const std::vector<InnerOuter>& anonymous_namespace{OverlapsJoinHashTable.cpp}::BucketSizeTuner::inner_outer_pairs_
private

Definition at line 515 of file OverlapsJoinHashTable.cpp.

const double anonymous_namespace{OverlapsJoinHashTable.cpp}::BucketSizeTuner::min_threshold_
private
size_t anonymous_namespace{OverlapsJoinHashTable.cpp}::BucketSizeTuner::num_dims_
private

Definition at line 508 of file OverlapsJoinHashTable.cpp.

size_t anonymous_namespace{OverlapsJoinHashTable.cpp}::BucketSizeTuner::num_steps_ {0}
private
const double anonymous_namespace{OverlapsJoinHashTable.cpp}::BucketSizeTuner::step_
private
const size_t anonymous_namespace{OverlapsJoinHashTable.cpp}::BucketSizeTuner::table_tuple_count_
private

Definition at line 516 of file OverlapsJoinHashTable.cpp.


The documentation for this class was generated from the following file: