13 years ago · 3d761fe47b
--- a/tests/datawizard/gpu_register.c
+++ b/tests/datawizard/gpu_register.c
@@ -1,6 +1,7 @@
 
				 /* StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				  *
			
 
				  * Copyright (C) 2011  Université de Bordeaux 1
			
 
				+ * Copyright (C) 2012 inria
			
 
				  *
			
 
				  * StarPU is free software; you can redistribute it and/or modify
			
 
				  * it under the terms of the GNU Lesser General Public License as published by
			
@@ -20,42 +21,75 @@
 
				 #include "../helper.h"
			
 
				 #include "scal.h"
			
 
				 
			
 
				-int main(int argc, char **argv)
			
 
				+static int
			
 
				+submit_tasks(starpu_data_handle_t handle, int pieces, int n)
			
 
				 {
			
 
				-	int ret;
			
 
				+	int i, ret;
			
 
				+
			
 
				+	for (i = 0; i < pieces; i++)
			
 
				+	{
			
 
				+		struct starpu_task *task = starpu_task_create();
			
 
				+
			
 
				+		task->handles[0] = starpu_data_get_sub_data(handle, 1, i);
			
 
				+		task->cl = &scal_codelet;
			
 
				+		task->execute_on_a_specific_worker = 1;
			
 
				+		task->workerid = i%n;
			
 
				+
			
 
				+		ret = starpu_task_submit(task);
			
 
				+		if (ret == -ENODEV)
			
 
				+			return -ENODEV;
			
 
				+		STARPU_CHECK_RETURN_VALUE(ret, "starpu_task_submit");
			
 
				+	}
			
 
				+
			
 
				+	ret = starpu_task_wait_for_all();
			
 
				+	STARPU_CHECK_RETURN_VALUE(ret, "starpu_task_wait_for_all");
			
 
				+
			
 
				+	return 0;
			
 
				+}
			
 
				+
			
 
				+static int
			
 
				+find_a_worker(enum starpu_archtype type)
			
 
				+{
			
 
				+	int worker;
			
 
				+	int ret = starpu_worker_get_ids_by_type(type, &worker, 1);
			
 
				+	if (ret == 0)
			
 
				+		return -ENODEV;
			
 
				+	return worker;
			
 
				+}
			
 
				+
			
 
				+static int
			
 
				+check_result(unsigned *t, size_t size)
			
 
				+{
			
 
				+	int i;
			
 
				+	for (i = 0; i < size; i++)
			
 
				+	{
			
 
				+		if (t[i] != i*2)
			
 
				+		{
			
 
				+			FPRINTF(stderr,"t[%d] is %d instead of %d\n", i, t[i], 2*i);
			
 
				+			return 1;
			
 
				+		}
			
 
				+	}
			
 
				+	return 0;
			
 
				+}
			
 
				+
			
 
				 #ifdef STARPU_USE_CUDA
			
 
				 #if CUDART_VERSION >= 4000
			
 
				+static int
			
 
				+test_cuda(void)
			
 
				+{
			
 
				+	int ret;
			
 
				 	unsigned *foo_gpu;
			
 
				 	unsigned *foo;
			
 
				-	starpu_data_handle_t handle;
			
 
				 	int n, i, size, pieces;
			
 
				 	int devid;
			
 
				-	unsigned workerid;
			
 
				-	int chosen = -1;
			
 
				+	int chosen;
			
 
				 	cudaError_t cures;
			
 
				-#endif
			
 
				-#endif
			
 
				-	ret = starpu_init(NULL);
			
 
				-	if (ret == -ENODEV) return STARPU_TEST_SKIPPED;
			
 
				-	STARPU_CHECK_RETURN_VALUE(ret, "starpu_init");
			
 
				-
			
 
				-#ifdef STARPU_USE_CUDA
			
 
				-#if CUDART_VERSION >= 4000 /* We need thread-safety of CUDA */
			
 
				-	/* TODO OpenCL, too */
			
 
				-	for (workerid = 0; workerid < starpu_worker_get_count(); workerid++) {
			
 
				-		if (starpu_worker_get_type(workerid) == STARPU_CUDA_WORKER) {
			
 
				-			chosen = workerid;
			
 
				-			break;
			
 
				-		}
			
 
				-	}
			
 
				-
			
 
				-	if (chosen == -1)
			
 
				-		return STARPU_TEST_SKIPPED;
			
 
				+	starpu_data_handle_t handle;
			
 
				 
			
 
				-#ifdef STARPU_USE_OPENCL
			
 
				-	ret = starpu_opencl_load_opencl_from_file("tests/datawizard/scal_opencl.cl", &opencl_program, NULL);
			
 
				-	STARPU_CHECK_RETURN_VALUE(ret, "starpu_opencl_load_opencl_from_file");
			
 
				-#endif
			
 
				+	/* Find a CUDA worker */
			
 
				+	chosen = find_a_worker(STARPU_CUDA_WORKER);
			
 
				+	if (chosen == -ENODEV)
			
 
				+		return -ENODEV;
			
 
				 
			
 
				 	n = starpu_worker_get_count();
			
 
				 	size = 10 * n;
			
@@ -92,21 +126,9 @@ int main(int argc, char **argv)
 
				 
			
 
				 	starpu_data_partition(handle, &f);
			
 
				 
			
 
				-	for (i = 0; i < pieces; i++) {
			
 
				-		struct starpu_task *task = starpu_task_create();
			
 
				-
			
 
				-		task->handles[0] = starpu_data_get_sub_data(handle, 1, i);
			
 
				-		task->cl = &scal_codelet;
			
 
				-		task->execute_on_a_specific_worker = 1;
			
 
				-		task->workerid = i%n;
			
 
				-
			
 
				-		ret = starpu_task_submit(task);
			
 
				-		if (ret == -ENODEV) goto enodev;
			
 
				-		STARPU_CHECK_RETURN_VALUE(ret, "starpu_task_submit");
			
 
				-	}
			
 
				-
			
 
				-	ret = starpu_task_wait_for_all();
			
 
				-	STARPU_CHECK_RETURN_VALUE(ret, "starpu_task_wait_for_all");
			
 
				+	ret = submit_tasks(handle, pieces, n);
			
 
				+	if (ret == -ENODEV)
			
 
				+		return -ENODEV;
			
 
				 
			
 
				 	starpu_data_unpartition(handle, starpu_worker_get_memory_node(chosen));
			
 
				 	starpu_data_unregister(handle);
			
@@ -116,24 +138,152 @@ int main(int argc, char **argv)
 
				 	if (STARPU_UNLIKELY(cures))
			
 
				 		STARPU_CUDA_REPORT_ERROR(cures);
			
 
				 
			
 
				-	starpu_shutdown();
			
 
				+	return check_result(foo, size);
			
 
				+}
			
 
				+#endif
			
 
				+#endif
			
 
				 
			
 
				-	for (i = 0; i < size; i++) {
			
 
				-		if (foo[i] != i*2) {
			
 
				-			FPRINTF(stderr,"value %d is %d instead of %d\n", i, foo[i], 2*i);
			
 
				-			return EXIT_FAILURE;
			
 
				-		}
			
 
				-	}
			
 
				+#ifdef STARPU_USE_OPENCL
			
 
				+static int
			
 
				+test_opencl(void)
			
 
				+{
			
 
				+	int i;
			
 
				+	int ret;
			
 
				+	int chosen;
			
 
				+	int n;
			
 
				+	int size;
			
 
				+	int pieces;
			
 
				+	cl_mem foo_gpu;
			
 
				+	starpu_data_handle_t handle;
			
 
				+
			
 
				+	ret = starpu_opencl_load_opencl_from_file("tests/datawizard/scal_opencl.cl", &opencl_program, NULL);
			
 
				+	STARPU_CHECK_RETURN_VALUE(ret, "starpu_opencl_load_opencl_from_file");
			
 
				+
			
 
				+	/* Find an OpenCL worker */
			
 
				+	chosen = find_a_worker(STARPU_OPENCL_WORKER);
			
 
				+	if (chosen == -ENODEV)
			
 
				+		return -ENODEV;
			
 
				+
			
 
				+	n = starpu_worker_get_count();
			
 
				+	size = 10 * n;
			
 
				+
			
 
				+	int devid;
			
 
				+	cl_int err;
			
 
				+	cl_context context;
			
 
				+	cl_command_queue queue;
			
 
				+
			
 
				+	devid = starpu_worker_get_devid(chosen);
			
 
				+
			
 
				+	starpu_opencl_get_context(devid, &context);
			
 
				+	starpu_opencl_get_queue(devid, &queue);
			
 
				+
			
 
				+	foo_gpu = clCreateBuffer(context, CL_MEM_READ_WRITE, size*sizeof(int), NULL, &err);
			
 
				+	if (STARPU_UNLIKELY(err != CL_SUCCESS))
			
 
				+		STARPU_OPENCL_REPORT_ERROR(err);
			
 
				+
			
 
				+	unsigned int *foo = malloc(size*sizeof(*foo));
			
 
				+	for (i = 0; i < size; i++)
			
 
				+		foo[i] = i;
			
 
				+
			
 
				+	err = clEnqueueWriteBuffer(queue,
			
 
				+				foo_gpu,
			
 
				+				CL_TRUE,
			
 
				+				0,
			
 
				+				size*sizeof(int),
			
 
				+				foo,
			
 
				+				0,
			
 
				+				NULL,
			
 
				+				NULL);
			
 
				+	if (STARPU_UNLIKELY(err != CL_SUCCESS))
			
 
				+		STARPU_OPENCL_REPORT_ERROR(err);
			
 
				+
			
 
				+
			
 
				+	
			
 
				+	starpu_vector_data_register(&handle,
			
 
				+				    starpu_worker_get_memory_node(chosen),
			
 
				+				    (uintptr_t)foo_gpu,
			
 
				+				    size,
			
 
				+				    sizeof(int));
			
 
				+
			
 
				+	/* Broadcast the data to force in-place partitioning */
			
 
				+	for (i = 0; i < n; i++)
			
 
				+		starpu_data_prefetch_on_node(handle, starpu_worker_get_memory_node(i), 0);
			
 
				+
			
 
				+	/* Even with just one worker, split in at least two */
			
 
				+	if (n == 1)
			
 
				+		pieces = 2;
			
 
				+	else
			
 
				+		pieces = n;
			
 
				 
			
 
				-        return EXIT_SUCCESS;
			
 
				+	struct starpu_data_filter f =
			
 
				+	{
			
 
				+		.filter_func = starpu_block_filter_func_vector,
			
 
				+		.nchildren = pieces,
			
 
				+	};
			
 
				+
			
 
				+	starpu_data_partition(handle, &f);
			
 
				+	
			
 
				+	ret = submit_tasks(handle, pieces, n);
			
 
				+	if (ret == -ENODEV)
			
 
				+		return -ENODEV;
			
 
				 
			
 
				-enodev:
			
 
				+	starpu_data_unpartition(handle, starpu_worker_get_memory_node(chosen));
			
 
				 	starpu_data_unregister(handle);
			
 
				+
			
 
				+	STARPU_CHECK_RETURN_VALUE(ret, "starpu_task_wait_for_all");
			
 
				+	ret = starpu_opencl_unload_opencl(&opencl_program);
			
 
				+	STARPU_CHECK_RETURN_VALUE(ret, "starpu_opencl_load_opencl_from_file");
			
 
				+
			
 
				+	err = clEnqueueReadBuffer(queue,
			
 
				+		foo_gpu,
			
 
				+		CL_TRUE,
			
 
				+		0,
			
 
				+		size*sizeof(*foo),
			
 
				+		foo,
			
 
				+		0,
			
 
				+		NULL,
			
 
				+		NULL);
			
 
				+	if (STARPU_UNLIKELY(err != CL_SUCCESS))
			
 
				+		STARPU_OPENCL_REPORT_ERROR(err);
			
 
				+	return check_result(foo, size);
			
 
				+}
			
 
				+#endif /* !STARPU_USE_OPENCL */
			
 
				+
			
 
				+int main(int argc, char **argv)
			
 
				+{
			
 
				+	int skipped_cuda = 1, skipped_opencl = 1;
			
 
				+	int ret;
			
 
				+	ret = starpu_init(NULL);
			
 
				+	if (ret == -ENODEV)
			
 
				+		return STARPU_TEST_SKIPPED;
			
 
				+	STARPU_CHECK_RETURN_VALUE(ret, "starpu_init");
			
 
				+
			
 
				+#ifdef STARPU_USE_CUDA
			
 
				+#if CUDART_VERSION >= 4000 /* We need thread-safety of CUDA */
			
 
				+	ret = test_cuda();
			
 
				+	if (ret == 1)
			
 
				+		goto fail;
			
 
				+	else if (ret == 0)
			
 
				+		skipped_cuda = 0;
			
 
				+#endif
			
 
				 #endif
			
 
				+
			
 
				+#ifdef STARPU_USE_OPENCL
			
 
				+	ret = test_opencl();
			
 
				+	if (ret == 1)
			
 
				+		goto fail;
			
 
				+	else if (ret == 0)
			
 
				+		skipped_opencl = 0;
			
 
				 #endif
			
 
				-	fprintf(stderr, "WARNING: No one can execute this task\n");
			
 
				-	/* yes, we do not perform the computation but we did detect that no one
			
 
				- 	 * could perform the kernel, so this is not an error from StarPU */
			
 
				+
			
 
				+	starpu_shutdown();
			
 
				+
			
 
				+	if (skipped_cuda == 1 && skipped_opencl == 1)
			
 
				+		return STARPU_TEST_SKIPPED;
			
 
				+
			
 
				+	return EXIT_SUCCESS;
			
 
				+
			
 
				+fail:
			
 
				 	starpu_shutdown();
			
 
				-	return STARPU_TEST_SKIPPED;
			
 
				+	return EXIT_FAILURE;
			
 
				 }