123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125 |
- /* StarPU --- Runtime system for heterogeneous multicore architectures.
- *
- * Copyright (C) 2011-2020 Université de Bordeaux, CNRS (LaBRI UMR 5800), Inria
- *
- * StarPU is free software; you can redistribute it and/or modify
- * it under the terms of the GNU Lesser General Public License as published by
- * the Free Software Foundation; either version 2.1 of the License, or (at
- * your option) any later version.
- *
- * StarPU is distributed in the hope that it will be useful, but
- * WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
- *
- * See the GNU Lesser General Public License in COPYING.LGPL for more details.
- */
- #include <starpu.h>
- #include "../test_interfaces.h"
- #define KERNEL_LOCATION "tests/datawizard/interfaces/tensor/tensor_opencl_kernel.cl" /* Path of the OpenCL source handed to starpu_opencl_load_opencl_from_file() below. */
- extern struct test_config tensor_config; /* Defined elsewhere; its copy_failed field seeds, and later receives, the kernel's one-int result buffer. */
- static struct starpu_opencl_program opencl_program; /* Program object loaded and unloaded again on every call of test_tensor_opencl_func(). */
- void
- test_tensor_opencl_func(void *buffers[], void *args)
- {
- STARPU_SKIP_IF_VALGRIND;
- int id, devid, ret;
- int factor = *(int *) args;
- cl_int err;
- cl_kernel kernel;
- cl_command_queue queue;
- cl_event event;
- ret = starpu_opencl_load_opencl_from_file(KERNEL_LOCATION, &opencl_program, NULL);
- STARPU_CHECK_RETURN_VALUE(ret, "starpu_opencl_load_opencl_from_file");
- int nx = STARPU_TENSOR_GET_NX(buffers[0]);
- int ny = STARPU_TENSOR_GET_NY(buffers[0]);
- int nz = STARPU_TENSOR_GET_NZ(buffers[0]);
- int nt = STARPU_TENSOR_GET_NT(buffers[0]);
- unsigned ldy = STARPU_TENSOR_GET_LDY(buffers[0]);
- unsigned ldz = STARPU_TENSOR_GET_LDZ(buffers[0]);
- unsigned ldt = STARPU_TENSOR_GET_LDT(buffers[0]);
- cl_mem tensor = (cl_mem) STARPU_TENSOR_GET_DEV_HANDLE(buffers[0]);
- cl_context context;
- id = starpu_worker_get_id_check();
- devid = starpu_worker_get_devid(id);
- starpu_opencl_get_context(devid, &context);
- cl_mem fail = clCreateBuffer(context, CL_MEM_COPY_HOST_PTR,
- sizeof(int), &tensor_config.copy_failed, &err);
- if (err != CL_SUCCESS)
- STARPU_OPENCL_REPORT_ERROR(err);
- err = starpu_opencl_load_kernel(&kernel,
- &queue,
- &opencl_program,
- "tensor_opencl",
- devid);
- if (err != CL_SUCCESS)
- STARPU_OPENCL_REPORT_ERROR(err);
- int nargs;
- nargs = starpu_opencl_set_kernel_args(&err, &kernel,
- sizeof(tensor), &tensor,
- sizeof(nx), &nx,
- sizeof(ny), &ny,
- sizeof(nz), &nz,
- sizeof(nt), &nt,
- sizeof(ldy), &ldy,
- sizeof(ldz), &ldz,
- sizeof(ldt), &ldt,
- sizeof(factor), &factor,
- sizeof(fail), &fail,
- 0);
- if (nargs != 10)
- {
- fprintf(stderr, "Failed to set argument #%d\n", nargs);
- STARPU_OPENCL_REPORT_ERROR(err);
- }
-
- {
- size_t global[3] = {nx, ny, nz*nt};
- err = clEnqueueNDRangeKernel(queue,
- kernel,
- 3,
- NULL,
- global,
- NULL,
- 0,
- NULL,
- &event);
- if (err != CL_SUCCESS)
- STARPU_OPENCL_REPORT_ERROR(err);
- }
- err = clEnqueueReadBuffer(queue,
- fail,
- CL_TRUE,
- 0,
- sizeof(int),
- &tensor_config.copy_failed,
- 0,
- NULL,
- NULL);
- if (err != CL_SUCCESS)
- STARPU_OPENCL_REPORT_ERROR(err);
- clFinish(queue);
- starpu_opencl_collect_stats(event);
- clReleaseEvent(event);
- starpu_opencl_release_kernel(kernel);
- ret = starpu_opencl_unload_opencl(&opencl_program);
- STARPU_CHECK_RETURN_VALUE(ret, "starpu_opencl_unload_opencl");
- }
|