17 #ifndef __STARPU_CUDA_H__
18 #define __STARPU_CUDA_H__
22 #if defined STARPU_USE_CUDA && !defined STARPU_DONT_INCLUDE_CUDA_HEADERS
24 #include <cuda_runtime.h>
25 #include <cuda_runtime_api.h>
27 #ifdef STARPU_HAVE_LIBNVIDIA_ML
/*
 * Convenience wrapper around starpu_cublas_report_error().
 *
 * Expands to a call that passes the call-site location (__starpu_func__,
 * __FILE__, __LINE__) followed by `status`, so callers only have to supply
 * the status value.
 *
 * NOTE(review): __starpu_func__ is defined outside this excerpt; presumably it
 * expands to the name of the enclosing function -- confirm.
 * NOTE(review): `status` is forwarded as-is; the accepted type is whatever
 * starpu_cublas_report_error() declares for its last parameter.
 */
49 #define STARPU_CUBLAS_REPORT_ERROR(status) starpu_cublas_report_error(__starpu_func__, __FILE__, __LINE__, status)
/*
 * Convenience wrapper around starpu_cuda_report_error().
 *
 * Expands to a call that passes the call-site location (__starpu_func__,
 * __FILE__, __LINE__) followed by `status`, so callers only have to supply
 * the status value.
 *
 * NOTE(review): __starpu_func__ is defined outside this excerpt; presumably it
 * expands to the name of the enclosing function -- confirm.
 * NOTE(review): `status` is forwarded as-is; the accepted type is whatever
 * starpu_cuda_report_error() declares for its last parameter.
 */
59 #define STARPU_CUDA_REPORT_ERROR(status) starpu_cuda_report_error(__starpu_func__, __FILE__, __LINE__, status)
/*
 * Prototype of starpu_cuda_copy_async_sync().
 *
 * Parameters (as declared):
 *   src_ptr, src_node  - a pointer and an unsigned node identifier for the
 *                        source side.
 *   dst_ptr, dst_node  - a pointer and an unsigned node identifier for the
 *                        destination side.
 *   ssize              - a size_t size argument.
 *   stream             - a cudaStream_t.
 *   kind               - an enum cudaMemcpyKind value.
 *
 * Returns an int.
 *
 * NOTE(review): only the declaration is visible here. The name and parameter
 * names suggest this copies `ssize` bytes from src_ptr to dst_ptr, trying an
 * asynchronous copy on `stream` and falling back to a synchronous one --
 * confirm against the implementation, including the meaning of the return
 * value and whether `stream` may be NULL.
 */
89 int starpu_cuda_copy_async_sync(
void *src_ptr,
unsigned src_node,
void *dst_ptr,
unsigned dst_node,
size_t ssize, cudaStream_t stream,
enum cudaMemcpyKind kind);
106 size_t numblocks,
size_t ld_src,
size_t ld_dst,
107 cudaStream_t stream,
enum cudaMemcpyKind kind);
125 size_t numblocks_1,
size_t ld1_src,
size_t ld1_dst,
126 size_t numblocks_2,
size_t ld2_src,
size_t ld2_dst,
127 cudaStream_t stream,
enum cudaMemcpyKind kind);
136 #ifdef STARPU_HAVE_LIBNVIDIA_ML
/*
 * Prototype of starpu_cuda_get_nvmldev(): takes an unsigned `devid` and
 * returns an nvmlDevice_t.
 *
 * NOTE(review): this declaration appears to sit inside the preceding
 * `#ifdef STARPU_HAVE_LIBNVIDIA_ML` region, so it would only be available
 * when that macro is defined -- confirm, the matching #endif is not visible
 * in this excerpt.
 * NOTE(review): presumably `devid` is a CUDA device index and the result is
 * the NVML handle for that same device; verify against the implementation.
 */
140 nvmlDevice_t starpu_cuda_get_nvmldev(
unsigned devid);
void starpu_cuda_report_error(const char *func, const char *file, int line, cudaError_t status)
void starpu_cublas_report_error(const char *func, const char *file, int line, int status)
int starpu_cuda_copy_async_sync(void *src_ptr, unsigned src_node, void *dst_ptr, unsigned dst_node, size_t ssize, cudaStream_t stream, enum cudaMemcpyKind kind)
void starpu_cuda_set_device(unsigned devid)
int starpu_cuda_copy2d_async_sync(void *src_ptr, unsigned src_node, void *dst_ptr, unsigned dst_node, size_t blocksize, size_t numblocks, size_t ld_src, size_t ld_dst, cudaStream_t stream, enum cudaMemcpyKind kind)
const struct cudaDeviceProp * starpu_cuda_get_device_properties(unsigned workerid)
cudaStream_t starpu_cuda_get_local_stream(void)
int starpu_cuda_copy3d_async_sync(void *src_ptr, unsigned src_node, void *dst_ptr, unsigned dst_node, size_t blocksize, size_t numblocks_1, size_t ld1_src, size_t ld1_dst, size_t numblocks_2, size_t ld2_src, size_t ld2_dst, cudaStream_t stream, enum cudaMemcpyKind kind)