_execution_kernel_8h_source.html

 /*

  * Copyright 2022 HEAVY.AI, Inc.

  *

  * Licensed under the Apache License, Version 2.0 (the "License");

  * you may not use this file except in compliance with the License.

  * You may obtain a copy of the License at

  *

  *     http://www.apache.org/licenses/LICENSE-2.0

  *

  * Unless required by applicable law or agreed to in writing, software

  * distributed under the License is distributed on an "AS IS" BASIS,

  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

  * See the License for the specific language governing permissions and

  * limitations under the License.

  */


 #pragma once


 #include <utility>

 #include "Logger/Logger.h"
 #include "QueryEngine/ColumnFetcher.h"
 #include "QueryEngine/Descriptors/QueryCompilationDescriptor.h"

 #include "Shared/threading.h"


 #ifdef HAVE_TBB

 #include "tbb/enumerable_thread_specific.h"

 #endif


 /**
  * @brief Context object passed by reference to ExecutionKernel::run() and held by
  *        KernelSubtask.
  *
  * It stores (result set, outer-table fragment ids) pairs, a vector of fragment row
  * offsets, a reference to the query's table infos, the number of threads allocated
  * to the query and, when built with TBB, a task group pointer plus thread-local
  * QueryExecutionContext instances.
  *
  * getFragOffsets(), addDeviceResults() and getFragmentResults() are only declared
  * here; their bodies live outside this header.
  */
 class SharedKernelContext {
  public:
   /**
    * @param query_infos Table infos of the query. Only a reference is stored, so the
    *                    vector must outlive this context.
    *
    * The constructor is explicit so that a vector is never implicitly converted into
    * a context that keeps a reference to it.
    */
   explicit SharedKernelContext(const std::vector<InputTableInfo>& query_infos)
       : query_infos_(query_infos) {}

   /// @return the fragment row offsets (defined out of line).
   const std::vector<uint64_t>& getFragOffsets();

   /**
    * Hands a device's result set to the context together with the ids of the
    * outer-table fragments it belongs to (defined out of line).
    */
   void addDeviceResults(ResultSetPtr&& device_results,
                         std::vector<size_t> outer_table_fragment_ids);

   /// @return the (result set, fragment ids) pairs; presumably all_fragment_results_
   ///         -- confirm against the out-of-line definition.
   std::vector<std::pair<ResultSetPtr, std::vector<size_t>>>& getFragmentResults();

   /// @return the table infos this context was constructed with.
   const std::vector<InputTableInfo>& getQueryInfos() const {
     return query_infos_;
   }

   /// Sets the number of threads allocated to execute the query.
   void setNumAllocatedThreads(size_t num_threads) {
     num_allocated_threads_ = num_threads;
   }

   /// @return the number of threads allocated to execute the query (1 unless
   ///         setNumAllocatedThreads() was called).
   size_t getNumAllocatedThreads() const {
     return num_allocated_threads_;
   }

   // Public flag, initially clear. NOTE(review): by its name it records whether the
   // dynamic watchdog has already been set for this query -- confirm at the use site.
   std::atomic_flag dynamic_watchdog_set = ATOMIC_FLAG_INIT;

 #ifdef HAVE_TBB
   /// @return the task group set via setThreadPool(), or nullptr if none was set.
   auto getThreadPool() const {
     return task_group_;
   }

   /// Stores a non-owning pointer to the task group; this class never deletes it.
   void setThreadPool(threading::task_group* tg) {
     task_group_ = tg;
   }

   /// @return the per-thread QueryExecutionContext storage.
   auto& getTlsExecutionContext() {
     return tls_execution_context_;
   }
 #endif  // HAVE_TBB

  private:
   // NOTE(review): presumably serializes updates to all_fragment_results_ -- confirm
   // against the out-of-line member definitions.
   std::mutex reduce_mutex_;
   std::vector<std::pair<ResultSetPtr, std::vector<size_t>>> all_fragment_results_;

   std::vector<uint64_t> all_frag_row_offsets_;
   // NOTE(review): presumably guards all_frag_row_offsets_ -- confirm against the
   // out-of-line definition of getFragOffsets().
   std::mutex all_frag_row_offsets_mutex_;

   // Reference to caller-owned data; see the constructor's lifetime requirement.
   const std::vector<InputTableInfo>& query_infos_;
   // Default-constructed; nothing in this header assigns it.
   const RegisteredQueryHint query_hint_;

   // Number of threads used to execute the query (kernel). It defaults to one, which
   // means serial query execution; after the kernel has been compiled it is set to a
   // proper value based on the query's status.
   size_t num_allocated_threads_{1};

 #ifdef HAVE_TBB
   // Non-owning; nullptr until setThreadPool() is called.
   threading::task_group* task_group_{nullptr};
   tbb::enumerable_thread_specific<std::unique_ptr<QueryExecutionContext>>
       tls_execution_context_;
 #endif  // HAVE_TBB
 };


 /**
  * @brief Bundles everything needed to run one kernel on one chosen device.
  *
  * The kernel stores references to the execution unit, execution options, column
  * fetcher and the compilation / memory descriptors, so all of those must outlive
  * the kernel. The fragment list is copied into the kernel.
  */
 class ExecutionKernel {
  public:
   /**
    * Captures the arguments as members; no other work is done here.
    *
    * Reference parameters are stored as references, frag_list is copied, and
    * render_info is stored as a raw pointer.
    */
   ExecutionKernel(const RelAlgExecutionUnit& ra_exe_unit,
                   const ExecutorDeviceType chosen_device_type,
                   int chosen_device_id,
                   const ExecutionOptions& eo,
                   const ColumnFetcher& column_fetcher,
                   const QueryCompilationDescriptor& query_comp_desc,
                   const QueryMemoryDescriptor& query_mem_desc,
                   const FragmentsList& frag_list,
                   const ExecutorDispatchMode kernel_dispatch_mode,
                   RenderInfo* render_info,
                   const int64_t rowid_lookup_key)
       : ra_exe_unit_(ra_exe_unit),
         chosen_device_type(chosen_device_type),
         chosen_device_id(chosen_device_id),
         eo(eo),
         column_fetcher(column_fetcher),
         query_comp_desc(query_comp_desc),
         query_mem_desc(query_mem_desc),
         frag_list(frag_list),
         kernel_dispatch_mode(kernel_dispatch_mode),
         render_info_(render_info),
         rowid_lookup_key(rowid_lookup_key) {
   }

   /// Entry point for executing this kernel (defined out of line).
   void run(Executor* executor,
            const size_t thread_idx,
            SharedKernelContext& shared_context);

   /// @return a copy of the fragment list this kernel was built with.
   FragmentsList get_fragment_list() const {
     return frag_list;
   }

   /// @return the id of the device chosen for this kernel.
   int32_t get_chosen_device_id() const {
     return chosen_device_id;
   }

   // Publicly readable execution unit; a reference to caller-owned data.
   const RelAlgExecutionUnit& ra_exe_unit_;

  private:
   // KernelSubtask reads this kernel's private state directly.
   friend class KernelSubtask;

   /// Out-of-line worker; NOTE(review): presumably invoked by run() -- confirm.
   void runImpl(Executor* executor,
                const size_t thread_idx,
                SharedKernelContext& shared_context);

   // Constructor arguments, stored in declaration order.
   const ExecutorDeviceType chosen_device_type;
   int chosen_device_id;
   const ExecutionOptions& eo;
   const ColumnFetcher& column_fetcher;
   const QueryCompilationDescriptor& query_comp_desc;
   const QueryMemoryDescriptor& query_mem_desc;
   const FragmentsList frag_list;
   const ExecutorDispatchMode kernel_dispatch_mode;
   RenderInfo* render_info_;
   const int64_t rowid_lookup_key;

   // Starts out empty; not assigned anywhere in this header.
   ResultSetPtr device_results_;
 };


 #ifdef HAVE_TBB

 /**
  * @brief A piece of work tied to a parent ExecutionKernel (TBB builds only).
  *
  * The subtask keeps references to the parent kernel and the shared context (both
  * must outlive it) and shares ownership of the fetch result and the chunk
  * iterators through shared_ptr.
  */
 class KernelSubtask {
  public:
   /**
    * @param k                     Parent kernel; stored by reference.
    * @param shared_context        Shared context; stored by reference.
    * @param fetch_result          Shared fetch result; ownership is shared.
    * @param chunk_iterators       Shared chunk iterators; ownership is shared.
    * @param total_num_input_rows  Stored as given.
    * @param start_rowid           Stored as given. NOTE(review): presumably the first
    *                              row this subtask handles -- confirm in runImpl().
    * @param num_rows_to_process   Stored as given. NOTE(review): presumably the number
    *                              of rows starting at start_rowid -- confirm.
    * @param thread_idx            Stored as given.
    */
   KernelSubtask(ExecutionKernel& k,
                 SharedKernelContext& shared_context,
                 std::shared_ptr<FetchResult> fetch_result,
                 std::shared_ptr<std::list<ChunkIter>> chunk_iterators,
                 int64_t total_num_input_rows,
                 size_t start_rowid,
                 size_t num_rows_to_process,
                 size_t thread_idx)
       : kernel_(k)
       , shared_context_(shared_context)
       // The shared_ptr parameters are by-value sinks: move them into the members
       // instead of copying, which avoids an extra atomic refcount round trip each.
       , fetch_result_(std::move(fetch_result))
       , chunk_iterators_(std::move(chunk_iterators))
       , total_num_input_rows_(total_num_input_rows)
       , start_rowid_(start_rowid)
       , num_rows_to_process_(num_rows_to_process)
       , thread_idx_(thread_idx) {}

   /// Entry point for executing this subtask (defined out of line).
   void run(Executor* executor);

  private:
   /// Out-of-line worker; NOTE(review): presumably invoked by run() -- confirm.
   void runImpl(Executor* executor);

   ExecutionKernel& kernel_;
   SharedKernelContext& shared_context_;
   std::shared_ptr<FetchResult> fetch_result_;
   std::shared_ptr<std::list<ChunkIter>> chunk_iterators_;
   int64_t total_num_input_rows_;
   size_t start_rowid_;
   size_t num_rows_to_process_;
   size_t thread_idx_;
 };

 #endif  // HAVE_TBB

SharedKernelContext::dynamic_watchdog_set
std::atomic_flag dynamic_watchdog_set
Definition: ExecutionKernel.h:58

ExecutionKernel::eo
const ExecutionOptions & eo
Definition: ExecutionKernel.h:128

SharedKernelContext::getFragOffsets
const std::vector< uint64_t > & getFragOffsets()
Definition: ExecutionKernel.cpp:102

ExecutionKernel::get_chosen_device_id
int32_t get_chosen_device_id() const
Definition: ExecutionKernel.h:122

SharedKernelContext::num_allocated_threads_
size_t num_allocated_threads_
Definition: ExecutionKernel.h:83

QueryMemoryDescriptor
Definition: QueryMemoryDescriptor.h:68

ExecutionKernel::kernel_dispatch_mode
const ExecutorDispatchMode kernel_dispatch_mode
Definition: ExecutionKernel.h:133

threading_std::task_group
Definition: threading_std.h:109

ExecutionKernel::ra_exe_unit_
const RelAlgExecutionUnit & ra_exe_unit_
Definition: ExecutionKernel.h:123

SharedKernelContext::all_frag_row_offsets_
std::vector< uint64_t > all_frag_row_offsets_
Definition: ExecutionKernel.h:76

ExecutionKernel::rowid_lookup_key
const int64_t rowid_lookup_key
Definition: ExecutionKernel.h:135

SharedKernelContext::all_frag_row_offsets_mutex_
std::mutex all_frag_row_offsets_mutex_
Definition: ExecutionKernel.h:77

SharedKernelContext::addDeviceResults
void addDeviceResults(ResultSetPtr &&device_results, std::vector< size_t > outer_table_fragment_ids)
Definition: ExecutionKernel.cpp:115

ExecutionKernel
Definition: ExecutionKernel.h:92

ExecutionKernel::chosen_device_type
const ExecutorDeviceType chosen_device_type
Definition: ExecutionKernel.h:126

foreign_storage::num_rows_to_process
size_t num_rows_to_process(const size_t start_row_index, const size_t max_fragment_size, const size_t rows_remaining)
Definition: AbstractTextFileDataWrapper.cpp:493

ResultSetPtr
std::shared_ptr< ResultSet > ResultSetPtr
Definition: RelAlgExecutionUnit.h:231

ExecutionKernel::render_info_
RenderInfo * render_info_
Definition: ExecutionKernel.h:134

thread_idx_
thread_idx_(0)
Definition: QueryMemoryInitializer.cpp:488

QueryCompilationDescriptor.h
Container for compilation results and assorted options for a single execution unit.

FragmentsList
std::vector< FragmentsPerTable > FragmentsList
Definition: QueryFragmentDescriptor.h:58

ExecutorDeviceType
ExecutorDeviceType
Definition: ExecutorDeviceType.h:23

ExecutorDispatchMode
ExecutorDispatchMode
Definition: CompilationOptions.h:29

ColumnFetcher.h

ExecutionKernel::get_fragment_list
FragmentsList get_fragment_list() const
Definition: ExecutionKernel.h:121

threading.h

RenderInfo
Definition: RenderInfo.h:31

SharedKernelContext::query_hint_
const RegisteredQueryHint query_hint_
Definition: ExecutionKernel.h:79

ExecutionKernel::query_mem_desc
const QueryMemoryDescriptor & query_mem_desc
Definition: ExecutionKernel.h:131

ColumnFetcher
Definition: ColumnFetcher.h:49

Logger.h

ExecutionKernel::chosen_device_id
int chosen_device_id
Definition: ExecutionKernel.h:127

RegisteredQueryHint
Definition: QueryHint.h:190

ExecutionKernel::query_comp_desc
const QueryCompilationDescriptor & query_comp_desc
Definition: ExecutionKernel.h:130

ExecutionOptions
Definition: CompilationOptions.h:68

ExecutionKernel::runImpl
void runImpl(Executor *executor, const size_t thread_idx, SharedKernelContext &shared_context)
Definition: ExecutionKernel.cpp:183

SharedKernelContext::all_fragment_results_
std::vector< std::pair< ResultSetPtr, std::vector< size_t > > > all_fragment_results_
Definition: ExecutionKernel.h:74

ExecutionKernel::run
void run(Executor *executor, const size_t thread_idx, SharedKernelContext &shared_context)
Definition: ExecutionKernel.cpp:129

ExecutionKernel::frag_list
const FragmentsList frag_list
Definition: ExecutionKernel.h:132

ExecutionKernel::ExecutionKernel
ExecutionKernel(const RelAlgExecutionUnit &ra_exe_unit, const ExecutorDeviceType chosen_device_type, int chosen_device_id, const ExecutionOptions &eo, const ColumnFetcher &column_fetcher, const QueryCompilationDescriptor &query_comp_desc, const QueryMemoryDescriptor &query_mem_desc, const FragmentsList &frag_list, const ExecutorDispatchMode kernel_dispatch_mode, RenderInfo *render_info, const int64_t rowid_lookup_key)
Definition: ExecutionKernel.h:94

SharedKernelContext::getQueryInfos
const std::vector< InputTableInfo > & getQueryInfos() const
Definition: ExecutionKernel.h:46

ExecutionKernel::device_results_
ResultSetPtr device_results_
Definition: ExecutionKernel.h:137

SharedKernelContext::getFragmentResults
std::vector< std::pair< ResultSetPtr, std::vector< size_t > > > & getFragmentResults()
Definition: ExecutionKernel.cpp:125

SharedKernelContext::reduce_mutex_
std::mutex reduce_mutex_
Definition: ExecutionKernel.h:73

SharedKernelContext::setNumAllocatedThreads
void setNumAllocatedThreads(size_t num_threads)
Definition: ExecutionKernel.h:50

QueryCompilationDescriptor
Definition: QueryCompilationDescriptor.h:53

run
static bool run
Definition: KafkaImporter.cpp:49

SharedKernelContext
Definition: ExecutionKernel.h:29

SharedKernelContext::query_infos_
const std::vector< InputTableInfo > & query_infos_
Definition: ExecutionKernel.h:78

SharedKernelContext::getNumAllocatedThreads
size_t getNumAllocatedThreads()
Definition: ExecutionKernel.h:54

ExecutionKernel::KernelSubtask
friend class KernelSubtask
Definition: ExecutionKernel.h:143

SharedKernelContext::SharedKernelContext
SharedKernelContext(const std::vector< InputTableInfo > &query_infos)
Definition: ExecutionKernel.h:31

RelAlgExecutionUnit
Definition: RelAlgExecutionUnit.h:165

ExecutionKernel::column_fetcher
const ColumnFetcher & column_fetcher
Definition: ExecutionKernel.h:129