18#ifndef __DRIVER_CUDA_H__
19#define __DRIVER_CUDA_H__
23#include <common/config.h>
25void _starpu_cuda_preinit(
void);
29#include <cuda_runtime_api.h>
30#ifdef STARPU_HAVE_NVML_H
36#include <core/workers.h>
39#pragma GCC visibility push(hidden)
44extern int _starpu_nworker_per_cuda;
46void _starpu_cuda_init(
void);
47unsigned _starpu_get_cuda_device_count(
void);
48#ifdef STARPU_HAVE_HWLOC
50hwloc_obj_t _starpu_cuda_get_hwloc_obj(hwloc_topology_t topology,
int devid);
54#if defined(STARPU_USE_CUDA) || defined(STARPU_SIMGRID)
59void _starpu_init_cuda(
void);
60void _starpu_init_cublas_v2_func(
void);
61void _starpu_shutdown_cublas_v2_func(
void);
62void _starpu_cublas_v2_init(
void);
63void _starpu_cublas_v2_shutdown(
void);
64void *_starpu_cuda_worker(
void *);
65#ifdef STARPU_HAVE_NVML_H
66nvmlDevice_t _starpu_cuda_get_nvmldev(
struct cudaDeviceProp *props);
67extern __typeof__(nvmlInit) *_starpu_nvmlInit;
68extern __typeof__(nvmlDeviceGetNvLinkState) *_starpu_nvmlDeviceGetNvLinkState;
69extern __typeof__(nvmlDeviceGetNvLinkRemotePciInfo) *_starpu_nvmlDeviceGetNvLinkRemotePciInfo;
70extern __typeof__(nvmlDeviceGetHandleByIndex) *_starpu_nvmlDeviceGetHandleByIndex;
71extern __typeof__(nvmlDeviceGetHandleByPciBusId) *_starpu_nvmlDeviceGetHandleByPciBusId;
72extern __typeof__(nvmlDeviceGetIndex) *_starpu_nvmlDeviceGetIndex;
73extern __typeof__(nvmlDeviceGetPciInfo) *_starpu_nvmlDeviceGetPciInfo;
74extern __typeof__(nvmlDeviceGetUUID) *_starpu_nvmlDeviceGetUUID;
75#if HAVE_DECL_NVMLDEVICEGETTOTALENERGYCONSUMPTION
76extern __typeof__(nvmlDeviceGetTotalEnergyConsumption) *_starpu_nvmlDeviceGetTotalEnergyConsumption;
81# define _starpu_cuda_discover_devices(config) ((void) config)
84#pragma GCC visibility pop
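/*
 * Cross-reference residue from the documentation listing this text was
 * extracted from.  It is not part of the header and is kept only for
 * reference:
 *
 *   #define STARPU_MAXNUMANODES
 *   Definition: starpu_config.h:272
 *   Definition: workers.h:441
 *   Definition: workers.h:352
 *   int devid[STARPU_NARCH][STARPU_NMAXDEVS]
 *   Definition: workers.h:404
 *   Definition: node_ops.h:92
 *   Definition: workers.h:155
 */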