12 年之前 · 8552a9d86b
--- a/src/core/topology.c
+++ b/src/core/topology.c
@@ -38,103 +38,28 @@
 
				 
			
 
				 static unsigned topology_is_initialized = 0;
			
 
				 
			
 
				-static void _starpu_initialize_workers_bindid(struct _starpu_machine_config *config);
			
 
				-
			
 
				 #if defined(STARPU_USE_CUDA) || defined(STARPU_USE_OPENCL)
			
 
				+
			
 
				 struct handle_entry
			
 
				 {
			
 
				 	UT_hash_handle hh;
			
 
				 	unsigned gpuid;
			
 
				 };
			
 
				+
			
 
				 #  ifdef STARPU_USE_CUDA
			
 
				-static void _starpu_initialize_workers_cuda_gpuid(struct _starpu_machine_config *config);
			
 
				 /* Entry in the `devices_using_cuda' hash table.  */
			
 
				 static struct handle_entry *devices_using_cuda;
			
 
				 #  endif
			
 
				-#  ifdef STARPU_USE_OPENCL
			
 
				-static void _starpu_initialize_workers_opencl_gpuid(struct _starpu_machine_config *config);
			
 
				-#  endif
			
 
				-static void _starpu_initialize_workers_gpuid(int *explicit_workers_gpuid,
			
 
				-                                             int *current, int *workers_gpuid, const char *varname, unsigned nhwgpus);
			
 
				+
			
 
				 static unsigned may_bind_automatically = 0;
			
 
				-#endif
			
 
				+
			
 
				+#endif // defined(STARPU_USE_CUDA) || defined(STARPU_USE_OPENCL)
			
 
				+
			
 
				 
			
 
				 /*
			
 
				  * Discover the topology of the machine
			
 
				  */
			
 
				 
			
 
				-#ifdef STARPU_USE_CUDA
			
 
				-static void _starpu_initialize_workers_cuda_gpuid(struct _starpu_machine_config *config)
			
 
				-{
			
 
				-	struct starpu_machine_topology *topology = &config->topology;
			
 
				-
			
 
				-        _starpu_initialize_workers_gpuid(config->conf->use_explicit_workers_cuda_gpuid==0?NULL:(int *)config->conf->workers_cuda_gpuid,
			
 
				-                                         &(config->current_cuda_gpuid), (int *)topology->workers_cuda_gpuid, "STARPU_WORKERS_CUDAID",
			
 
				-                                         topology->nhwcudagpus);
			
 
				-}
			
 
				-#endif
			
 
				-
			
 
				-#ifdef STARPU_USE_OPENCL
			
 
				-static void _starpu_initialize_workers_opencl_gpuid(struct _starpu_machine_config *config)
			
 
				-{
			
 
				-	struct starpu_machine_topology *topology = &config->topology;
			
 
				-
			
 
				-        _starpu_initialize_workers_gpuid(config->conf->use_explicit_workers_opencl_gpuid==0?NULL:(int *)config->conf->workers_opencl_gpuid,
			
 
				-                                         &(config->current_opencl_gpuid), (int *)topology->workers_opencl_gpuid, "STARPU_WORKERS_OPENCLID",
			
 
				-                                         topology->nhwopenclgpus);
			
 
				-
			
 
				-#ifdef STARPU_USE_CUDA
			
 
				-        // Detect devices which are already used with CUDA
			
 
				-        {
			
 
				-                unsigned tmp[STARPU_NMAXWORKERS];
			
 
				-                unsigned nb=0;
			
 
				-                int i;
			
 
				-                for(i=0 ; i<STARPU_NMAXWORKERS ; i++)
			
 
				-		{
			
 
				-			struct handle_entry *entry;
			
 
				-			int devid = config->topology.workers_opencl_gpuid[i];
			
 
				-
			
 
				-			HASH_FIND_INT(devices_using_cuda, &devid, entry);
			
 
				-			if (entry == NULL)
			
 
				-			{
			
 
				-                                tmp[nb] = topology->workers_opencl_gpuid[i];
			
 
				-                                nb++;
			
 
				-                        }
			
 
				-                }
			
 
				-                for(i=nb ; i<STARPU_NMAXWORKERS ; i++) tmp[i] = -1;
			
 
				-                memcpy(topology->workers_opencl_gpuid, tmp, sizeof(unsigned)*STARPU_NMAXWORKERS);
			
 
				-        }
			
 
				-#endif /* STARPU_USE_CUDA */
			
 
				-        {
			
 
				-                // Detect identical devices
			
 
				-		struct handle_entry *devices_already_used = NULL;
			
 
				-                unsigned tmp[STARPU_NMAXWORKERS];
			
 
				-                unsigned nb=0;
			
 
				-                int i;
			
 
				-
			
 
				-                for(i=0 ; i<STARPU_NMAXWORKERS ; i++)
			
 
				-		{
			
 
				-			int devid = topology->workers_opencl_gpuid[i];
			
 
				-			struct handle_entry *entry;
			
 
				-			HASH_FIND_INT(devices_already_used, &devid, entry);
			
 
				-			if (entry == NULL)
			
 
				-			{
			
 
				-				struct handle_entry *entry2;
			
 
				-				entry2 = (struct handle_entry *) malloc(sizeof(*entry2));
			
 
				-				STARPU_ASSERT(entry2 != NULL);
			
 
				-				entry2->gpuid = devid;
			
 
				-				HASH_ADD_INT(devices_already_used, gpuid, entry2);
			
 
				-                                tmp[nb] = devid;
			
 
				-                                nb ++;
			
 
				-                        }
			
 
				-                }
			
 
				-                for(i=nb ; i<STARPU_NMAXWORKERS ; i++) tmp[i] = -1;
			
 
				-                memcpy(topology->workers_opencl_gpuid, tmp, sizeof(unsigned)*STARPU_NMAXWORKERS);
			
 
				-        }
			
 
				-}
			
 
				-#endif
			
 
				-
			
 
				-
			
 
				 #if defined(STARPU_USE_CUDA) || defined(STARPU_USE_OPENCL)
			
 
				 static void _starpu_initialize_workers_gpuid(int *explicit_workers_gpuid,
			
 
				                                              int *current, int *workers_gpuid, const char *varname, unsigned nhwgpus)
			
@@ -212,6 +137,79 @@ static void _starpu_initialize_workers_gpuid(int *explicit_workers_gpuid,
 
				 #endif
			
 
				 
			
 
				 #ifdef STARPU_USE_CUDA
			
 
				+static void _starpu_initialize_workers_cuda_gpuid(struct _starpu_machine_config *config)
			
 
				+{
			
 
				+	struct starpu_machine_topology *topology = &config->topology;
			
 
				+
			
 
				+        _starpu_initialize_workers_gpuid(config->conf->use_explicit_workers_cuda_gpuid==0?NULL:(int *)config->conf->workers_cuda_gpuid,
			
 
				+                                         &(config->current_cuda_gpuid), (int *)topology->workers_cuda_gpuid, "STARPU_WORKERS_CUDAID",
			
 
				+                                         topology->nhwcudagpus);
			
 
				+}
			
 
				+#endif
			
 
				+
			
 
				+#ifdef STARPU_USE_OPENCL
			
 
				+static void _starpu_initialize_workers_opencl_gpuid(struct _starpu_machine_config *config)
			
 
				+{
			
 
				+	struct starpu_machine_topology *topology = &config->topology;
			
 
				+
			
 
				+        _starpu_initialize_workers_gpuid(config->conf->use_explicit_workers_opencl_gpuid==0?NULL:(int *)config->conf->workers_opencl_gpuid,
			
 
				+                                         &(config->current_opencl_gpuid), (int *)topology->workers_opencl_gpuid, "STARPU_WORKERS_OPENCLID",
			
 
				+                                         topology->nhwopenclgpus);
			
 
				+
			
 
				+#ifdef STARPU_USE_CUDA
			
 
				+        // Detect devices which are already used with CUDA
			
 
				+        {
			
 
				+                unsigned tmp[STARPU_NMAXWORKERS];
			
 
				+                unsigned nb=0;
			
 
				+                int i;
			
 
				+                for(i=0 ; i<STARPU_NMAXWORKERS ; i++)
			
 
				+		{
			
 
				+			struct handle_entry *entry;
			
 
				+			int devid = config->topology.workers_opencl_gpuid[i];
			
 
				+
			
 
				+			HASH_FIND_INT(devices_using_cuda, &devid, entry);
			
 
				+			if (entry == NULL)
			
 
				+			{
			
 
				+                                tmp[nb] = topology->workers_opencl_gpuid[i];
			
 
				+                                nb++;
			
 
				+                        }
			
 
				+                }
			
 
				+                for(i=nb ; i<STARPU_NMAXWORKERS ; i++) tmp[i] = -1;
			
 
				+                memcpy(topology->workers_opencl_gpuid, tmp, sizeof(unsigned)*STARPU_NMAXWORKERS);
			
 
				+        }
			
 
				+#endif /* STARPU_USE_CUDA */
			
 
				+        {
			
 
				+                // Detect identical devices
			
 
				+		struct handle_entry *devices_already_used = NULL;
			
 
				+                unsigned tmp[STARPU_NMAXWORKERS];
			
 
				+                unsigned nb=0;
			
 
				+                int i;
			
 
				+
			
 
				+                for(i=0 ; i<STARPU_NMAXWORKERS ; i++)
			
 
				+		{
			
 
				+			int devid = topology->workers_opencl_gpuid[i];
			
 
				+			struct handle_entry *entry;
			
 
				+			HASH_FIND_INT(devices_already_used, &devid, entry);
			
 
				+			if (entry == NULL)
			
 
				+			{
			
 
				+				struct handle_entry *entry2;
			
 
				+				entry2 = (struct handle_entry *) malloc(sizeof(*entry2));
			
 
				+				STARPU_ASSERT(entry2 != NULL);
			
 
				+				entry2->gpuid = devid;
			
 
				+				HASH_ADD_INT(devices_already_used, gpuid, entry2);
			
 
				+                                tmp[nb] = devid;
			
 
				+                                nb ++;
			
 
				+                        }
			
 
				+                }
			
 
				+                for(i=nb ; i<STARPU_NMAXWORKERS ; i++) tmp[i] = -1;
			
 
				+                memcpy(topology->workers_opencl_gpuid, tmp, sizeof(unsigned)*STARPU_NMAXWORKERS);
			
 
				+        }
			
 
				+}
			
 
				+#endif
			
 
				+
			
 
				+
			
 
				+
			
 
				+#ifdef STARPU_USE_CUDA
			
 
				 static inline int _starpu_get_next_cuda_gpuid(struct _starpu_machine_config *config)
			
 
				 {
			
 
				 	unsigned i = ((config->current_cuda_gpuid++) % config->topology.ncudagpus);
			
@@ -272,6 +270,80 @@ static void _starpu_init_topology(struct _starpu_machine_config *config)
 
				 	}
			
 
				 }
			
 
				 
			
 
				+/*
			
 
				+ * Bind workers on the different processors
			
 
				+ */
			
 
				+static void _starpu_initialize_workers_bindid(struct _starpu_machine_config *config)
			
 
				+{
			
 
				+	char *strval;
			
 
				+	unsigned i;
			
 
				+
			
 
				+	struct starpu_machine_topology *topology = &config->topology;
			
 
				+
			
 
				+	config->current_bindid = 0;
			
 
				+
			
 
				+	/* conf->workers_bindid indicates the successive cpu identifier that
			
 
				+	 * should be used to bind the workers. It should be either filled
			
 
				+	 * according to the user's explicit parameters (from starpu_conf) or
			
 
				+	 * according to the STARPU_WORKERS_CPUID env. variable. Otherwise, a
			
 
				+	 * round-robin policy is used to distributed the workers over the
			
 
				+	 * cpus. */
			
 
				+
			
 
				+	/* what do we use, explicit value, env. variable, or round-robin ? */
			
 
				+	if ((strval = getenv("STARPU_WORKERS_CPUID")))
			
 
				+	{
			
 
				+		/* STARPU_WORKERS_CPUID certainly contains less entries than
			
 
				+		 * STARPU_NMAXWORKERS, so we reuse its entries in a round robin
			
 
				+		 * fashion: "1 2" is equivalent to "1 2 1 2 1 2 .... 1 2". */
			
 
				+		unsigned wrap = 0;
			
 
				+		unsigned number_of_entries = 0;
			
 
				+
			
 
				+		char *endptr;
			
 
				+		/* we use the content of the STARPU_WORKERS_CUDAID env. variable */
			
 
				+		for (i = 0; i < STARPU_NMAXWORKERS; i++)
			
 
				+		{
			
 
				+			if (!wrap)
			
 
				+			{
			
 
				+				long int val;
			
 
				+				val = strtol(strval, &endptr, 10);
			
 
				+				if (endptr != strval)
			
 
				+				{
			
 
				+					topology->workers_bindid[i] = (unsigned)(val % topology->nhwcpus);
			
 
				+					strval = endptr;
			
 
				+				}
			
 
				+				else
			
 
				+				{
			
 
				+					/* there must be at least one entry */
			
 
				+					STARPU_ASSERT(i != 0);
			
 
				+					number_of_entries = i;
			
 
				+
			
 
				+					/* there is no more values in the string */
			
 
				+					wrap = 1;
			
 
				+
			
 
				+					topology->workers_bindid[i] = topology->workers_bindid[0];
			
 
				+				}
			
 
				+			}
			
 
				+			else
			
 
				+			{
			
 
				+				topology->workers_bindid[i] = topology->workers_bindid[i % number_of_entries];
			
 
				+			}
			
 
				+		}
			
 
				+	}
			
 
				+	else if (config->conf->use_explicit_workers_bindid)
			
 
				+	{
			
 
				+		/* we use the explicit value from the user */
			
 
				+		memcpy(topology->workers_bindid,
			
 
				+			config->conf->workers_bindid,
			
 
				+			STARPU_NMAXWORKERS*sizeof(unsigned));
			
 
				+	}
			
 
				+	else
			
 
				+	{
			
 
				+		/* by default, we take a round robin policy */
			
 
				+		for (i = 0; i < STARPU_NMAXWORKERS; i++)
			
 
				+			topology->workers_bindid[i] = (unsigned)(i % topology->nhwcpus);
			
 
				+	}
			
 
				+}
			
 
				+
			
 
				 unsigned _starpu_topology_get_nhwcpu(struct _starpu_machine_config *config)
			
 
				 {
			
 
				 	_starpu_init_topology(config);
			
@@ -511,79 +583,6 @@ static int _starpu_init_machine_config(struct _starpu_machine_config *config)
 
				 	return 0;
			
 
				 }
			
 
				 
			
 
				-/*
			
 
				- * Bind workers on the different processors
			
 
				- */
			
 
				-static void _starpu_initialize_workers_bindid(struct _starpu_machine_config *config)
			
 
				-{
			
 
				-	char *strval;
			
 
				-	unsigned i;
			
 
				-
			
 
				-	struct starpu_machine_topology *topology = &config->topology;
			
 
				-
			
 
				-	config->current_bindid = 0;
			
 
				-
			
 
				-	/* conf->workers_bindid indicates the successive cpu identifier that
			
 
				-	 * should be used to bind the workers. It should be either filled
			
 
				-	 * according to the user's explicit parameters (from starpu_conf) or
			
 
				-	 * according to the STARPU_WORKERS_CPUID env. variable. Otherwise, a
			
 
				-	 * round-robin policy is used to distributed the workers over the
			
 
				-	 * cpus. */
			
 
				-
			
 
				-	/* what do we use, explicit value, env. variable, or round-robin ? */
			
 
				-	if ((strval = getenv("STARPU_WORKERS_CPUID")))
			
 
				-	{
			
 
				-		/* STARPU_WORKERS_CPUID certainly contains less entries than
			
 
				-		 * STARPU_NMAXWORKERS, so we reuse its entries in a round robin
			
 
				-		 * fashion: "1 2" is equivalent to "1 2 1 2 1 2 .... 1 2". */
			
 
				-		unsigned wrap = 0;
			
 
				-		unsigned number_of_entries = 0;
			
 
				-
			
 
				-		char *endptr;
			
 
				-		/* we use the content of the STARPU_WORKERS_CUDAID env. variable */
			
 
				-		for (i = 0; i < STARPU_NMAXWORKERS; i++)
			
 
				-		{
			
 
				-			if (!wrap)
			
 
				-			{
			
 
				-				long int val;
			
 
				-				val = strtol(strval, &endptr, 10);
			
 
				-				if (endptr != strval)
			
 
				-				{
			
 
				-					topology->workers_bindid[i] = (unsigned)(val % topology->nhwcpus);
			
 
				-					strval = endptr;
			
 
				-				}
			
 
				-				else
			
 
				-				{
			
 
				-					/* there must be at least one entry */
			
 
				-					STARPU_ASSERT(i != 0);
			
 
				-					number_of_entries = i;
			
 
				-
			
 
				-					/* there is no more values in the string */
			
 
				-					wrap = 1;
			
 
				-
			
 
				-					topology->workers_bindid[i] = topology->workers_bindid[0];
			
 
				-				}
			
 
				-			}
			
 
				-			else
			
 
				-			{
			
 
				-				topology->workers_bindid[i] = topology->workers_bindid[i % number_of_entries];
			
 
				-			}
			
 
				-		}
			
 
				-	}
			
 
				-	else if (config->conf->use_explicit_workers_bindid)
			
 
				-	{
			
 
				-		/* we use the explicit value from the user */
			
 
				-		memcpy(topology->workers_bindid,
			
 
				-			config->conf->workers_bindid,
			
 
				-			STARPU_NMAXWORKERS*sizeof(unsigned));
			
 
				-	}
			
 
				-	else
			
 
				-	{
			
 
				-		/* by default, we take a round robin policy */
			
 
				-		for (i = 0; i < STARPU_NMAXWORKERS; i++)
			
 
				-			topology->workers_bindid[i] = (unsigned)(i % topology->nhwcpus);
			
 
				-	}
			
 
				-}
			
 
				 
			
 
				 /* This function gets the identifier of the next cpu on which to bind a
			
 
				  * worker. In case a list of preferred cpus was specified, we look for a an