This is the Executor subclass which represents the CUDA device.
More...
#include <ginkgo/core/base/executor.hpp>
This is the Executor subclass which represents the CUDA device.
◆ create() [1/2]
static std::shared_ptr<CudaExecutor> gko::CudaExecutor::create |
( |
int |
device_id, |
|
|
std::shared_ptr< Executor > |
master, |
|
|
bool |
device_reset, |
|
|
allocation_mode |
alloc_mode = default_cuda_alloc_mode , |
|
|
CUstream_st * |
stream = nullptr |
|
) |
| |
|
static |
Creates a new CudaExecutor.
- Parameters
-
device_id | the CUDA device id of this device |
master | an executor on the host that is used to invoke the device kernels |
device_reset | this option no longer has any effect. |
alloc_mode | the allocation mode that the executor should operate on. See allocation_mode for more details. |
stream | the stream to execute operations on. |
◆ create() [2/2]
Creates a new CudaExecutor with a custom allocator and device stream.
- Parameters
-
device_id | the CUDA device id of this device |
master | an executor on the host that is used to invoke the device kernels. |
alloc | the allocator to use for device memory allocations. |
stream | the stream to execute operations on. |
◆ get_closest_numa()
int gko::CudaExecutor::get_closest_numa |
( |
| ) |
const |
|
inline |
Get the closest NUMA node.
- Returns
- the NUMA node closest to this device
◆ get_closest_pus()
std::vector<int> gko::CudaExecutor::get_closest_pus |
( |
| ) |
const |
|
inline |
Get the closest PUs.
- Returns
- the array of PUs closest to this device
◆ get_cublas_handle()
cublasContext* gko::CudaExecutor::get_cublas_handle |
( |
| ) |
const |
|
inline |
Get the cublas handle for this executor.
- Returns
- the cublas handle (cublasContext*) for this executor
◆ get_cusparse_handle()
cusparseContext* gko::CudaExecutor::get_cusparse_handle |
( |
| ) |
const |
|
inline |
Get the cusparse handle for this executor.
- Returns
- the cusparse handle (cusparseContext*) for this executor
◆ get_master() [1/2]
std::shared_ptr<const Executor> gko::CudaExecutor::get_master |
( |
| ) |
const |
|
override virtual noexcept |
◆ get_master() [2/2]
std::shared_ptr<Executor> gko::CudaExecutor::get_master |
( |
| ) |
|
|
override virtual noexcept |
◆ get_stream()
CUstream_st* gko::CudaExecutor::get_stream |
( |
| ) |
const |
|
inline |
Returns the CUDA stream used by this executor.
Can be nullptr for the default stream.
- Returns
- the stream used to execute kernels and memory operations.
The documentation for this class was generated from the following file: