45 LOG(
INFO) <<
"Query Engine CUDA streams enabled";
55 LOG(
INFO) <<
"Query Engine CUDA streams disabled";
93 throw std::runtime_error(
"QueryEngine instance hasn't been created");
103 s = std::make_shared<QueryEngine>(cuda_mgr, cpu_only);
std::unique_ptr< CodeCacheAccessor< CpuCompilationContext > > cpu_code_accessor
size_t g_gpu_code_cache_max_size_in_bytes
void checkCudaErrors(CUresult err)
CUstream getCudaStreamForDevice(int device_num)
CudaMgr_Namespace::CudaMgr * cuda_mgr_
std::unique_ptr< CodeCacheAccessor< CompilationContext > > tf_code_accessor
void setContext(const int device_num) const
static std::weak_ptr< QueryEngine > instance_
int getDeviceCount() const
CUstream getQueryEngineCudaStream()
static std::shared_ptr< QueryEngine > createInstance(CudaMgr_Namespace::CudaMgr *cuda_mgr, bool cpu_only)
std::unique_lock< T > unique_lock
size_t g_code_cache_max_num_items
std::vector< CUstream > cuda_streams_
std::unique_ptr< CodeCacheAccessor< CpuCompilationContext > > s_stubs_accessor
QueryEngine(CudaMgr_Namespace::CudaMgr *cuda_mgr, bool cpu_only)
CUstream getQueryEngineCudaStreamForDevice(int device_num)
static std::shared_ptr< QueryEngine > getInstance()
bool g_query_engine_cuda_streams
std::unique_ptr< CodeCacheAccessor< GpuCompilationContext > > gpu_code_accessor
std::unique_ptr< CodeCacheAccessor< CpuCompilationContext > > s_code_accessor