|
@@ -0,0 +1,50 @@
|
|
|
|
+/*
|
|
|
|
+ * StarPU
|
|
|
|
+ * Copyright (C) INRIA 2008-2010 (see AUTHORS file)
|
|
|
|
+ *
|
|
|
|
+ * This program is free software; you can redistribute it and/or modify
|
|
|
|
+ * it under the terms of the GNU Lesser General Public License as published by
|
|
|
|
+ * the Free Software Foundation; either version 2.1 of the License, or (at
|
|
|
|
+ * your option) any later version.
|
|
|
|
+ *
|
|
|
|
+ * This program is distributed in the hope that it will be useful, but
|
|
|
|
+ * WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
|
|
|
|
+ *
|
|
|
|
+ * See the GNU Lesser General Public License in COPYING.LGPL for more details.
|
|
|
|
+ */
|
|
|
|
+
|
|
|
|
+#include <starpu.h>
|
|
|
|
+#include <common/config.h>
|
|
|
|
+#include <datawizard/filters.h>
|
|
|
|
+
|
|
|
|
+void starpu_block_filter_func_block(void *father_interface, void *child_interface, struct starpu_data_filter *f, unsigned id, unsigned nparts)
|
|
|
|
+{
|
|
|
|
+ starpu_block_interface_t *block_father = father_interface;
|
|
|
|
+ starpu_block_interface_t *block_child = child_interface;
|
|
|
|
+
|
|
|
|
+ uint32_t nx = block_father->nx;
|
|
|
|
+ uint32_t ny = block_father->ny;
|
|
|
|
+ uint32_t nz = block_father->nz;
|
|
|
|
+ size_t elemsize = block_father->elemsize;
|
|
|
|
+
|
|
|
|
+ STARPU_ASSERT(nparts <= nx);
|
|
|
|
+
|
|
|
|
+ uint32_t chunk_size = (nx + nparts - 1)/nparts;
|
|
|
|
+ size_t offset = id*chunk_size*elemsize;
|
|
|
|
+
|
|
|
|
+ uint32_t child_nx = STARPU_MIN(chunk_size, nx - id*chunk_size);
|
|
|
|
+
|
|
|
|
+ block_child->nx = child_nx;
|
|
|
|
+ block_child->ny = ny;
|
|
|
|
+ block_child->nz = nz;
|
|
|
|
+ block_child->elemsize = elemsize;
|
|
|
|
+
|
|
|
|
+ if (block_father->ptr) {
|
|
|
|
+ block_child->ptr = block_father->ptr + offset;
|
|
|
|
+ block_child->ldy = block_father->ldy;
|
|
|
|
+ block_child->ldz = block_father->ldz;
|
|
|
|
+ block_child->dev_handle = block_father->dev_handle;
|
|
|
|
+ block_child->offset = block_father->offset + offset;
|
|
|
|
+ }
|
|
|
|
+}
|