_scalar_code_generator_8cpp_source.html

 /*

  * Copyright 2022 HEAVY.AI, Inc.

  *

  * Licensed under the Apache License, Version 2.0 (the "License");

  * you may not use this file except in compliance with the License.

  * You may obtain a copy of the License at

  *

  *     http://www.apache.org/licenses/LICENSE-2.0

  *

  * Unless required by applicable law or agreed to in writing, software

  * distributed under the License is distributed on an "AS IS" BASIS,

  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

  * See the License for the specific language governing permissions and

  * limitations under the License.

  */


 #include "CodeGenerator.h"

 #include "ScalarExprVisitor.h"


 namespace {


 // Expression visitor that gathers the columns referenced by a scalar expression.
 // The result maps an InputColDescriptor (column id, table id, db id, range table
 // index) to a deep copy of the ColumnVar node that referenced it.
 class UsedColumnExpressions : public ScalarExprVisitor<ScalarCodeGenerator::ColumnMap> {
  protected:
   // Produces a single-entry map describing the visited column.
   ScalarCodeGenerator::ColumnMap visitColumnVar(
       const Analyzer::ColumnVar* column) const override {
     const auto& key = column->getColumnKey();
     ScalarCodeGenerator::ColumnMap single_column;
     single_column.emplace(
         InputColDescriptor(
             key.column_id, key.table_id, key.db_id, column->get_rte_idx()),
         std::static_pointer_cast<Analyzer::ColumnVar>(column->deep_copy()));
     return single_column;
   }

   // Merges two partial results. Entries already present in `aggregate` are kept;
   // an entry of `next_result` with the same key is not inserted again.
   ScalarCodeGenerator::ColumnMap aggregateResult(
       const ScalarCodeGenerator::ColumnMap& aggregate,
       const ScalarCodeGenerator::ColumnMap& next_result) const override {
     ScalarCodeGenerator::ColumnMap merged(aggregate);
     for (const auto& entry : next_result) {
       merged.insert(entry);
     }
     return merged;
   }
 };


 // File-local list of table infos. Within this file it is only read for its
 // size() when ScalarCodeGenerator::compile() constructs the CgenState; no code
 // visible here ever adds entries to it.
 std::vector<InputTableInfo> g_table_infos;


 // Translates a SQL type into the LLVM type used for scalar function arguments.
 // Only kINT is handled (as a 32-bit integer); every other type is reported via
 // LOG(FATAL), which is expected not to return.
 llvm::Type* llvm_type_from_sql(const SQLTypeInfo& ti, llvm::LLVMContext& ctx) {
   if (ti.get_type() == kINT) {
     return get_int_type(32, ctx);
   }
   LOG(FATAL) << "Unsupported type";
   return nullptr;  // satisfy -Wreturn-type
 }


 }  // namespace


 // Collects the columns referenced by `expr`, registers a descriptor for each of
 // them with the plan state so that local column ids get allocated, and returns
 // the collected column map.
 ScalarCodeGenerator::ColumnMap ScalarCodeGenerator::prepare(const Analyzer::Expr* expr) {
   UsedColumnExpressions column_collector;
   const auto referenced_columns = column_collector.visit(expr);

   // allocateLocalColumnIds() takes shared descriptors, so rebuild one per column.
   std::list<std::shared_ptr<const InputColDescriptor>> descriptors;
   for (const auto& column_entry : referenced_columns) {
     const InputColDescriptor& desc = column_entry.first;
     const auto& scan_desc = desc.getScanDesc();
     const auto& table_key = scan_desc.getTableKey();
     descriptors.push_back(
         std::make_shared<InputColDescriptor>(desc.getColId(),
                                              table_key.table_id,
                                              table_key.db_id,
                                              scan_desc.getNestLevel()));
   }
   plan_state_->allocateLocalColumnIds(descriptors);
   return referenced_columns;
 }


 // Generates the LLVM IR for evaluating a single scalar expression.
 //
 // The emitted function "scalar_expr" has the signature
 //   i32 scalar_expr(<result type>* out, <col 0>, <col 1>, ...)
 // where the column with local id N is passed as argument N + 1. The function
 // stores the expression value through `out` and returns the constant 0.
 //
 // When co.device_type is GPU, a second function "wrapper_scalar_expr" is also
 // emitted. It takes an i32* error slot, the result pointer and one pointer per
 // column; it loads each column value, calls scalar_expr and stores the returned
 // code into the error slot.
 //
 // @param expr           expression to compile
 // @param fetch_columns  forwarded to codegen()
 // @param co             compilation options; device_type selects whether the
 //                       GPU wrapper is generated
 // @return the generated function, the wrapper (nullptr unless GPU) and the
 //         input column expressions ordered by local column id
 ScalarCodeGenerator::CompiledExpression ScalarCodeGenerator::compile(
     const Analyzer::Expr* expr,
     const bool fetch_columns,
     const CompilationOptions& co) {
   CHECK(module_) << "Invalid code generator state";
   own_plan_state_ = std::make_unique<PlanState>(
       false, std::vector<InputTableInfo>{}, PlanState::DeletedColumnsMap{}, nullptr);
   plan_state_ = own_plan_state_.get();
   const auto used_columns = prepare(expr);

   // Slot 0 of arg_types is reserved for the result pointer, hence the +1.
   std::vector<llvm::Type*> arg_types(plan_state_->global_to_local_col_ids_.size() + 1);
   std::vector<std::shared_ptr<Analyzer::ColumnVar>> inputs(arg_types.size() - 1);
   auto& ctx = module_->getContext();
   for (const auto& kv : plan_state_->global_to_local_col_ids_) {
     const size_t arg_idx = kv.second;
     // Both inputs[arg_idx] and arg_types[arg_idx + 1] are written below, so the
     // local id has to be bounded by the number of inputs, not of arguments.
     CHECK_LT(arg_idx, inputs.size());
     const auto it = used_columns.find(kv.first);
     CHECK(it != used_columns.end());
     const auto& col_expr = it->second;
     inputs[arg_idx] = col_expr;
     const auto& ti = col_expr->get_type_info();
     arg_types[arg_idx + 1] = llvm_type_from_sql(ti, ctx);
   }
   arg_types[0] =
       llvm::PointerType::get(llvm_type_from_sql(expr->get_type_info(), ctx), 0);

   auto ft = llvm::FunctionType::get(get_int_type(32, ctx), arg_types, false);
   auto scalar_expr_func = llvm::Function::Create(
       ft, llvm::Function::ExternalLinkage, "scalar_expr", module_.get());
   auto bb_entry = llvm::BasicBlock::Create(ctx, ".entry", scalar_expr_func, 0);

   own_cgen_state_ = std::make_unique<CgenState>(g_table_infos.size(), false);
   own_cgen_state_->module_ = module_.get();
   own_cgen_state_->row_func_ = own_cgen_state_->current_func_ = scalar_expr_func;
   own_cgen_state_->ir_builder_.SetInsertPoint(bb_entry);
   cgen_state_ = own_cgen_state_.get();
   AUTOMATIC_IR_METADATA(cgen_state_);

   // Emit the expression body, store its value through the result pointer
   // (argument 0) and return 0.
   const auto expr_lvs = codegen(expr, fetch_columns, co);
   CHECK_EQ(expr_lvs.size(), size_t(1));
   cgen_state_->ir_builder_.CreateStore(expr_lvs.front(),
                                        cgen_state_->row_func_->arg_begin());
   cgen_state_->ir_builder_.CreateRet(ll_int<int32_t>(0, ctx));

   if (co.device_type == ExecutorDeviceType::GPU) {
     // Wrapper layout: [0] i32* error slot, [1] result pointer, [i + 1] pointer
     // to the value of scalar_expr argument i (for i >= 1).
     std::vector<llvm::Type*> wrapper_arg_types(arg_types.size() + 1);
     wrapper_arg_types[0] = llvm::PointerType::get(get_int_type(32, ctx), 0);
     wrapper_arg_types[1] = arg_types[0];
     for (size_t i = 1; i < arg_types.size(); ++i) {
       wrapper_arg_types[i + 1] = llvm::PointerType::get(arg_types[i], 0);
     }
     auto wrapper_ft =
         llvm::FunctionType::get(llvm::Type::getVoidTy(ctx), wrapper_arg_types, false);
     auto wrapper_scalar_expr_func =
         llvm::Function::Create(wrapper_ft,
                                llvm::Function::ExternalLinkage,
                                "wrapper_scalar_expr",
                                module_.get());
     auto wrapper_bb_entry =
         llvm::BasicBlock::Create(ctx, ".entry", wrapper_scalar_expr_func, 0);
     llvm::IRBuilder<> b(ctx);
     b.SetInsertPoint(wrapper_bb_entry);

     // The result pointer is forwarded untouched; every column is loaded first.
     std::vector<llvm::Value*> loaded_args = {wrapper_scalar_expr_func->arg_begin() + 1};
     for (size_t i = 2; i < wrapper_arg_types.size(); ++i) {
       auto* value = wrapper_scalar_expr_func->arg_begin() + i;
       // wrapper argument i points at a value of type arg_types[i - 1]; using
       // the recorded type avoids asking the pointer type for its pointee.
       loaded_args.push_back(b.CreateLoad(arg_types[i - 1], value));
     }
     auto error_lv = b.CreateCall(scalar_expr_func, loaded_args);
     b.CreateStore(error_lv, wrapper_scalar_expr_func->arg_begin());
     b.CreateRetVoid();
     return {scalar_expr_func, wrapper_scalar_expr_func, inputs};
   }
   return {scalar_expr_func, nullptr, inputs};
 }


 // Lowers a previously compiled expression to native code for the device chosen
 // in `co` and returns the resulting native function pointer(s).
 //
 // Requires that the module is still held and that no execution engine has been
 // created yet; the check fails otherwise.
 std::vector<void*> ScalarCodeGenerator::generateNativeCode(
     Executor* executor,
     const CompiledExpression& compiled_expression,
     const CompilationOptions& co) {
   CHECK(module_ && !execution_engine_.get()) << "Invalid code generator state";
   // Ownership of the module is given up here without being handed to anything
   // in this function.
   // NOTE(review): presumably the backend adopts the module through the
   // function's parent pointer; confirm, otherwise this leaks.
   module_.release();

   if (co.device_type == ExecutorDeviceType::CPU) {
     llvm::Function* const entry_func = compiled_expression.func;
     execution_engine_ = generateNativeCPUCode(entry_func, {entry_func}, co);
     return {execution_engine_->getPointerToFunction(entry_func)};
   }
   if (co.device_type == ExecutorDeviceType::GPU) {
     return generateNativeGPUCode(
         executor, compiled_expression.func, compiled_expression.wrapper_func, co);
   }
   LOG(FATAL) << "Invalid device type";
   return {};  // satisfy -Wreturn-type
 }


 // Returns the function argument that carries the value of `column`.
 //
 // Argument 0 of the row function is the result pointer, so the column with
 // local id N is found at argument N + 1.
 //
 // @param column        column reference to resolve
 // @param fetch_column  forwarded to PlanState::getLocalColumnId()
 // @param co            unused here
 // @return a single-element vector holding the matching function argument
 std::vector<llvm::Value*> ScalarCodeGenerator::codegenColumn(
     const Analyzer::ColumnVar* column,
     const bool fetch_column,
     const CompilationOptions& co) {
   const int arg_idx = plan_state_->getLocalColumnId(column, fetch_column);
   CHECK(arg_idx >= 0);
   // Validate the position that is actually dereferenced (local id + 1); checking
   // the bare local id would let the last id slip through to the end iterator.
   const size_t arg_pos = static_cast<size_t>(arg_idx) + 1;
   CHECK_LT(arg_pos, cgen_state_->row_func_->arg_size());
   llvm::Value* arg = cgen_state_->row_func_->arg_begin() + arg_pos;
   return {arg};
 }


 // Compiles `func` and `wrapper_func` for the GPU and returns the native function
 // pointers of the resulting compilation context.
 //
 // The NVPTX target machine (created for the Kepler architecture) and the CUDA
 // manager (constructed with argument 0) are created on first use and kept for
 // later calls.
 std::vector<void*> ScalarCodeGenerator::generateNativeGPUCode(
     Executor* executor,
     llvm::Function* func,
     llvm::Function* wrapper_func,
     const CompilationOptions& co) {
   if (nvptx_target_machine_ == nullptr) {
     nvptx_target_machine_ =
         initializeNVPTXBackend(CudaMgr_Namespace::NvidiaDeviceArch::Kepler);
   }
   if (cuda_mgr_ == nullptr) {
     cuda_mgr_ = std::make_unique<CudaMgr_Namespace::CudaMgr>(0);
   }

   GPUTarget target;
   target.row_func_not_inlined = false;
   target.cgen_state = cgen_state_;
   target.cuda_mgr = cuda_mgr_.get();
   target.nvptx_target_machine = nvptx_target_machine_.get();

   // Both generated functions must be treated as live by the backend.
   gpu_compilation_context_ = CodeGenerator::generateNativeGPUCode(
       executor,
       func,
       wrapper_func,
       {func, wrapper_func},
       /*is_gpu_smem_used=*/false,
       co,
       target);
   return gpu_compilation_context_->getNativeFunctionPointers();
 }

anonymous_namespace{ScalarCodeGenerator.cpp}::UsedColumnExpressions::visitColumnVar
ScalarCodeGenerator::ColumnMap visitColumnVar(const Analyzer::ColumnVar *column) const override
Definition: ScalarCodeGenerator.cpp:24

CompilationOptions
Definition: CompilationOptions.h:31

CHECK_EQ
#define CHECK_EQ(x, y)
Definition: Logger.h:301

ScalarCodeGenerator::compile
CompiledExpression compile(const Analyzer::Expr *expr, const bool fetch_columns, const CompilationOptions &co)
Definition: ScalarCodeGenerator.cpp:78

ScalarCodeGenerator::codegenColumn
std::vector< llvm::Value * > codegenColumn(const Analyzer::ColumnVar *, const bool fetch_column, const CompilationOptions &) override
Definition: ScalarCodeGenerator.cpp:170

ScalarCodeGenerator::CompiledExpression
Definition: CodeGenerator.h:689

anonymous_namespace{ScalarCodeGenerator.cpp}::llvm_type_from_sql
llvm::Type * llvm_type_from_sql(const SQLTypeInfo &ti, llvm::LLVMContext &ctx)
Definition: ScalarCodeGenerator.cpp:48

PlanState::DeletedColumnsMap
std::unordered_map< shared::TableKey, const ColumnDescriptor * > DeletedColumnsMap
Definition: PlanState.h:44

ScalarCodeGenerator::own_plan_state_
std::unique_ptr< PlanState > own_plan_state_
Definition: CodeGenerator.h:731

CodeGenerator::cgen_state_
CgenState * cgen_state_
Definition: CodeGenerator.h:666

ScalarCodeGenerator::execution_engine_
ExecutionEngineWrapper execution_engine_
Definition: CodeGenerator.h:729

LOG
#define LOG(tag)
Definition: Logger.h:285

Analyzer::Expr
Definition: Analyzer.h:68

ExecutionEngineWrapper::get
llvm::ExecutionEngine * get()
Definition: CompilationContext.h:49

CgenState::ir_builder_
llvm::IRBuilder ir_builder_
Definition: CgenState.h:384

ScalarCodeGenerator::nvptx_target_machine_
std::unique_ptr< llvm::TargetMachine > nvptx_target_machine_
Definition: CodeGenerator.h:734

InputColDescriptor
Definition: InputDescriptors.h:59

logger::FATAL
Definition: Logger.h:111

ScalarCodeGenerator::gpu_compilation_context_
std::shared_ptr< GpuCompilationContext > gpu_compilation_context_
Definition: CodeGenerator.h:733

ScalarCodeGenerator::CompiledExpression::func
llvm::Function * func
Definition: CodeGenerator.h:690

Analyzer::ColumnVar::deep_copy
std::shared_ptr< Analyzer::Expr > deep_copy() const override
Definition: Analyzer.cpp:66

CodeGenerator::generateNativeCPUCode
static ExecutionEngineWrapper generateNativeCPUCode(llvm::Function *func, const std::unordered_set< llvm::Function * > &live_funcs, const CompilationOptions &co)
Definition: NativeCodegen.cpp:439

SQLTypeInfo::get_type
HOST DEVICE SQLTypes get_type() const
Definition: sqltypes.h:391

ScalarCodeGenerator::ColumnMap
std::unordered_map< InputColDescriptor, std::shared_ptr< Analyzer::ColumnVar >> ColumnMap
Definition: CodeGenerator.h:712

get_int_type
llvm::Type * get_int_type(const int width, llvm::LLVMContext &context)
Definition: IRCodegenUtils.h:83

ScalarCodeGenerator::CompiledExpression::wrapper_func
llvm::Function * wrapper_func
Definition: CodeGenerator.h:691

Analyzer::ColumnVar
Definition: Analyzer.h:194

CodeGenerator::GPUTarget::cuda_mgr
const CudaMgr_Namespace::CudaMgr * cuda_mgr
Definition: CodeGenerator.h:101

CgenState::row_func_
llvm::Function * row_func_
Definition: CgenState.h:374

ExecutorDeviceType::GPU

ScalarCodeGenerator::cuda_mgr_
std::unique_ptr< CudaMgr_Namespace::CudaMgr > cuda_mgr_
Definition: CodeGenerator.h:732

CodeGenerator::GPUTarget::nvptx_target_machine
llvm::TargetMachine * nvptx_target_machine
Definition: CodeGenerator.h:100

PlanState::getLocalColumnId
int getLocalColumnId(const Analyzer::ColumnVar *col_var, const bool fetch_column)
Definition: PlanState.cpp:52

anonymous_namespace{ScalarCodeGenerator.cpp}::g_table_infos
std::vector< InputTableInfo > g_table_infos
Definition: ScalarCodeGenerator.cpp:46

ScalarExprVisitor.h

CodeGenerator::GPUTarget::row_func_not_inlined
bool row_func_not_inlined
Definition: CodeGenerator.h:103

anonymous_namespace{ScalarCodeGenerator.cpp}::UsedColumnExpressions::aggregateResult
ScalarCodeGenerator::ColumnMap aggregateResult(const ScalarCodeGenerator::ColumnMap &aggregate, const ScalarCodeGenerator::ColumnMap &next_result) const override
Definition: ScalarCodeGenerator.cpp:37

PlanState::allocateLocalColumnIds
void allocateLocalColumnIds(const std::list< std::shared_ptr< const InputColDescriptor >> &global_col_ids)
Definition: PlanState.cpp:40

AUTOMATIC_IR_METADATA
#define AUTOMATIC_IR_METADATA(CGENSTATE)
Definition: AutomaticIRMetadataGuard.h:205

Analyzer::Expr::get_type_info
const SQLTypeInfo & get_type_info() const
Definition: Analyzer.h:79

CompilationOptions::device_type
ExecutorDeviceType device_type
Definition: CompilationOptions.h:32

CodeGenerator::plan_state_
PlanState * plan_state_
Definition: CodeGenerator.h:667

CodeGenerator::codegen
std::vector< llvm::Value * > codegen(const Analyzer::Expr *, const bool fetch_columns, const CompilationOptions &)
Definition: IRCodegen.cpp:30

CHECK_LT
#define CHECK_LT(x, y)
Definition: Logger.h:303

Analyzer::ColumnVar::getColumnKey
const shared::ColumnKey & getColumnKey() const
Definition: Analyzer.h:198

CodeGenerator::generateNativeGPUCode
static std::shared_ptr< GpuCompilationContext > generateNativeGPUCode(Executor *executor, llvm::Function *func, llvm::Function *wrapper_func, const std::unordered_set< llvm::Function * > &live_funcs, const bool is_gpu_smem_used, const CompilationOptions &co, const GPUTarget &gpu_target)
Definition: NativeCodegen.cpp:1194

CodeGenerator::GPUTarget::cgen_state
CgenState * cgen_state
Definition: CodeGenerator.h:102

ScalarCodeGenerator::prepare
ColumnMap prepare(const Analyzer::Expr *)
Definition: ScalarCodeGenerator.cpp:62

ScalarCodeGenerator::own_cgen_state_
std::unique_ptr< CgenState > own_cgen_state_
Definition: CodeGenerator.h:730

anonymous_namespace{ScalarCodeGenerator.cpp}::UsedColumnExpressions
Definition: ScalarCodeGenerator.cpp:22

ExecutorDeviceType::CPU

Type
Type
Definition: ResultSetReductionOps.h:33

ScalarCodeGenerator::generateNativeGPUCode
std::vector< void * > generateNativeGPUCode(Executor *executor, llvm::Function *func, llvm::Function *wrapper_func, const CompilationOptions &co)
Definition: ScalarCodeGenerator.cpp:180

ScalarExprVisitor
Definition: ScalarExprVisitor.h:23

CodeGenerator.h

CHECK
#define CHECK(condition)
Definition: Logger.h:291

SQLTypeInfo
Definition: sqltypes.h:332

ScalarCodeGenerator::module_
std::unique_ptr< llvm::Module > module_
Definition: CodeGenerator.h:728

kINT
Definition: sqltypes.h:72

ScalarCodeGenerator::generateNativeCode
std::vector< void * > generateNativeCode(Executor *executor, const CompiledExpression &compiled_expression, const CompilationOptions &co)
Definition: ScalarCodeGenerator.cpp:147

Analyzer::ColumnVar::get_rte_idx
int32_t get_rte_idx() const
Definition: Analyzer.h:202

CodeGenerator::GPUTarget
Definition: CodeGenerator.h:99

CudaMgr_Namespace::NvidiaDeviceArch::Kepler

CodeGenerator::initializeNVPTXBackend
static std::unique_ptr< llvm::TargetMachine > initializeNVPTXBackend(const CudaMgr_Namespace::NvidiaDeviceArch arch)
Definition: NativeCodegen.cpp:1518

run_benchmark_import.result
dictionary result
Definition: run_benchmark_import.py:441