37 LOG(
INFO) <<
"Query Engine CUDA streams enabled";
47 LOG(
INFO) <<
"Query Engine CUDA streams disabled";
85 throw std::runtime_error(
"QueryEngine instance hasn't been created");
95 s = std::make_shared<QueryEngine>(cuda_mgr, cpu_only);
std::unique_ptr< CodeCacheAccessor< CpuCompilationContext > > cpu_code_accessor
void checkCudaErrors(CUresult err)
CUstream getCudaStreamForDevice(int device_num)
CudaMgr_Namespace::CudaMgr * cuda_mgr_
std::unique_ptr< CodeCacheAccessor< CompilationContext > > tf_code_accessor
void setContext(const int device_num) const
static std::weak_ptr< QueryEngine > instance_
int getDeviceCount() const
CUstream getQueryEngineCudaStream()
static std::shared_ptr< QueryEngine > createInstance(CudaMgr_Namespace::CudaMgr *cuda_mgr, bool cpu_only)
static constexpr size_t code_cache_size
std::unique_lock< T > unique_lock
std::vector< CUstream > cuda_streams_
std::unique_ptr< CodeCacheAccessor< CpuCompilationContext > > s_stubs_accessor
QueryEngine(CudaMgr_Namespace::CudaMgr *cuda_mgr, bool cpu_only)
CUstream getQueryEngineCudaStreamForDevice(int device_num)
static std::shared_ptr< QueryEngine > getInstance()
bool g_query_engine_cuda_streams
std::unique_ptr< CodeCacheAccessor< GpuCompilationContext > > gpu_code_accessor
std::unique_ptr< CodeCacheAccessor< CpuCompilationContext > > s_code_accessor