4 年之前 · c689d70e5e
--- a/ChangeLog
+++ b/ChangeLog
@@ -70,6 +70,7 @@ Small features:
 
																     instead of hyperthreads.
															
 
																   * New STARPU_TASK_PROGRESS environment variable to show task progression.
															
 
																   * Add STARPU_SIMGRID environment variable guard against native builds.
															
 
																+  * Add starpu_cuda_get_nvmldev function.
															
 
																 StarPU 1.3.7
															
 
																 ====================================================================
															
--- a/configure.ac
+++ b/configure.ac
@@ -1409,7 +1409,7 @@ if test x$enable_cuda = xyes; then
 
																 		AC_CHECK_DECLS([nvmlDeviceGetTotalEnergyConsumption], [
															
 
																 			AC_CHECK_FUNCS([nvmlDeviceGetTotalEnergyConsumption])
															
 
																 			], [], [[#include <nvml.h>]])
															
 
																-		AC_DEFINE([HAVE_LIBNVIDIA_ML], [1], [Define to 1 if you have the nvidia-ml library])
															
 
																+		AC_DEFINE([STARPU_HAVE_LIBNVIDIA_ML], [1], [Define to 1 if you have the nvidia-ml library])
															
 
																 		STARPU_CUDA_LDFLAGS="$STARPU_CUDA_LDFLAGS -lnvidia-ml"
															
 
																 	fi
															
 
																 	AC_MSG_CHECKING(whether nvidia-ml should be used)
															
--- a/include/starpu_config.h.in
+++ b/include/starpu_config.h.in
@@ -57,6 +57,14 @@
 
																 #undef STARPU_USE_CUDA
															
 
																 /**
															
 
																+   Defined when StarPU has been installed with
															
 
																+   NVidia-ML support. It should be used in your code to detect the
															
 
																+   availability of NVML-related functions.
															
 
																+   @ingroup API_CUDA_Extensions
															
 
																+*/
															
 
																+#undef STARPU_HAVE_LIBNVIDIA_ML
															
 
																+
															
 
																+/**
															
 
																    Defined when StarPU has been installed with OpenCL support. It
															
 
																    should be used in your code to detect the availability of OpenCL as
															
 
																    shown in \ref FullSourceCodeVectorScal.
															
--- a/include/starpu_cuda.h
+++ b/include/starpu_cuda.h
@@ -24,6 +24,10 @@
 
																 #include <cuda_runtime.h>
															
 
																 #include <cuda_runtime_api.h>
															
 
																+#ifdef STARPU_HAVE_LIBNVIDIA_ML
															
 
																+#include <nvml.h>
															
 
																+#endif
															
 
																+
															
 
																 #ifdef __cplusplus
															
 
																 extern "C"
															
 
																 {
															
@@ -129,6 +133,14 @@ int starpu_cuda_copy3d_async_sync(void *src_ptr, unsigned src_node, void *dst_pt
 
																 */
															
 
																 void starpu_cuda_set_device(unsigned devid);
															
 
																+#ifdef STARPU_HAVE_LIBNVIDIA_ML
															
 
																+/**
															
 
																+  Return the nvml device for a CUDA device
															
 
																+*/
															
 
																+nvmlDevice_t starpu_cuda_get_nvmldev(unsigned devid);
															
 
																+#endif
															
 
																+
															
 
																+
															
 
																 /** @} */
															
 
																 #ifdef __cplusplus
															
--- a/src/drivers/cuda/driver_cuda.c
+++ b/src/drivers/cuda/driver_cuda.c
@@ -31,7 +31,7 @@
 
																 #ifdef HAVE_CUDA_GL_INTEROP_H
															
 
																 #include <cuda_gl_interop.h>
															
 
																 #endif
															
 
																-#ifdef HAVE_LIBNVIDIA_ML
															
 
																+#ifdef STARPU_HAVE_LIBNVIDIA_ML
															
 
																 #include <nvml.h>
															
 
																 #endif
															
 
																 #include <datawizard/memory_manager.h>
															
@@ -63,7 +63,7 @@
 
																 static int ncudagpus = -1;
															
 
																 static size_t global_mem[STARPU_MAXCUDADEVS];
															
 
																-#ifdef HAVE_LIBNVIDIA_ML
															
 
																+#ifdef STARPU_HAVE_LIBNVIDIA_ML
															
 
																 static nvmlDevice_t nvmlDev[STARPU_MAXCUDADEVS];
															
 
																 #endif
															
 
																 int _starpu_cuda_bus_ids[STARPU_MAXCUDADEVS+STARPU_MAXNUMANODES][STARPU_MAXCUDADEVS+STARPU_MAXNUMANODES];
															
@@ -105,6 +105,13 @@ static size_t _starpu_cuda_get_global_mem_size(unsigned devid)
 
																 	return global_mem[devid];
															
 
																 }
															
 
																+#ifdef STARPU_HAVE_LIBNVIDIA_ML
															
 
																+nvmlDevice_t starpu_cuda_get_nvmldev(unsigned devid)
															
 
																+{
															
 
																+	return nvmlDev[devid];
															
 
																+}
															
 
																+#endif
															
 
																+
															
 
																 void
															
 
																 _starpu_cuda_discover_devices (struct _starpu_machine_config *config)
															
 
																 {
															
@@ -120,7 +127,7 @@ _starpu_cuda_discover_devices (struct _starpu_machine_config *config)
 
																 	if (STARPU_UNLIKELY(cures != cudaSuccess))
															
 
																 		cnt = 0;
															
 
																 	config->topology.nhwdevices[STARPU_CUDA_WORKER] = cnt;
															
 
																-#ifdef HAVE_LIBNVIDIA_ML
															
 
																+#ifdef STARPU_HAVE_LIBNVIDIA_ML
															
 
																 	nvmlInit();
															
 
																 #endif
															
 
																 #endif
															
@@ -738,7 +745,7 @@ int _starpu_cuda_driver_init(struct _starpu_worker_set *worker_set)
 
																 #if defined(STARPU_HAVE_BUSID) && !defined(STARPU_SIMGRID)
															
 
																 #if defined(STARPU_HAVE_DOMAINID) && !defined(STARPU_SIMGRID)
															
 
																-#ifdef HAVE_LIBNVIDIA_ML
															
 
																+#ifdef STARPU_HAVE_LIBNVIDIA_ML
															
 
																 		char busid[13];
															
 
																 		snprintf(busid, sizeof(busid), "%04x:%02x:%02x.0", props[devid].pciDomainID, props[devid].pciBusID, props[devid].pciDeviceID);
															
 
																 		nvmlDeviceGetHandleByPciBusId(busid, &nvmlDev[devid]);