|
@@ -90,10 +90,8 @@ opencl_shadow_host(int bz, TYPE *ptr, int nx, int ny, int nz, int ldy, int ldz,
|
|
|
threads_per_dim_y /= 2;
|
|
|
#if 0
|
|
|
unsigned threads_per_dim_z = 4;
|
|
|
- size_t dimBlock[] = {threads_per_dim_x, threads_per_dim_y, threads_per_dim_z};
|
|
|
size_t dimGrid[] = {nx / threads_per_dim_x, ny / threads_per_dim_y, nz / threads_per_dim_z};
|
|
|
#else
|
|
|
- size_t dimBlock[] = {threads_per_dim_x, threads_per_dim_y, 1};
|
|
|
size_t dimGrid[] = {((nx + threads_per_dim_x-1) / threads_per_dim_x)*threads_per_dim_x, ((ny + threads_per_dim_y-1) / threads_per_dim_y)*threads_per_dim_y, 1};
|
|
|
#endif
|
|
|
|
|
@@ -115,7 +113,7 @@ opencl_shadow_host(int bz, TYPE *ptr, int nx, int ny, int nz, int ldy, int ldz,
|
|
|
clSetKernelArg(kernel, 7, sizeof(i), &i);
|
|
|
|
|
|
cl_event ev;
|
|
|
- cl_int err = clEnqueueNDRangeKernel(cq, kernel, 3, NULL, dimGrid, dimBlock, 0, NULL, &ev);
|
|
|
+ cl_int err = clEnqueueNDRangeKernel(cq, kernel, 3, NULL, dimGrid, NULL, 0, NULL, &ev);
|
|
|
if (err != CL_SUCCESS)
|
|
|
STARPU_OPENCL_REPORT_ERROR(err);
|
|
|
clWaitForEvents(1, &ev);
|