/* GCC-StarPU
Copyright (C) 2012 Inria
GCC-StarPU is free software: you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation, either version 3 of the License, or
(at your option) any later version.
GCC-StarPU is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
along with GCC-StarPU. If not, see . */
#include
/* We must include starpu.h here, otherwise gcc will complain about a poisoned
malloc in xmmintrin.h. */
#include
#include
#include
#include
#include
#include
#include
#include
#include
#include
#ifdef HAVE_C_FAMILY_C_COMMON_H
# include
#elif HAVE_C_COMMON_H
# include
#endif
#include
#include
#include
#include
#include
/* Search path for OpenCL source files for the `opencl' pragma, as a
`TREE_LIST'. */
tree opencl_include_dirs = NULL_TREE;
/* Names of data structures defined in . */
static const char opencl_program_struct_tag[] = "starpu_opencl_program";
/* Return the type corresponding to OPENCL_PROGRAM_STRUCT_TAG. */
static tree
opencl_program_type (void)
{
tree t = TREE_TYPE (type_decl_for_struct_tag (opencl_program_struct_tag));
if (TYPE_SIZE (t) == NULL_TREE)
{
/* Incomplete type definition, for instance because
wasn't included. */
error_at (UNKNOWN_LOCATION, "StarPU OpenCL support is lacking");
t = error_mark_node;
}
return t;
}
static tree
opencl_kernel_type (void)
{
tree t = lookup_name (get_identifier ("cl_kernel"));
gcc_assert (t != NULL_TREE);
if (TREE_CODE (t) == TYPE_DECL)
t = TREE_TYPE (t);
gcc_assert (TYPE_P (t));
return t;
}
static tree
opencl_command_queue_type (void)
{
tree t = lookup_name (get_identifier ("cl_command_queue"));
gcc_assert (t != NULL_TREE);
if (TREE_CODE (t) == TYPE_DECL)
t = TREE_TYPE (t);
gcc_assert (TYPE_P (t));
return t;
}
static tree
opencl_event_type (void)
{
tree t = lookup_name (get_identifier ("cl_event"));
gcc_assert (t != NULL_TREE);
if (TREE_CODE (t) == TYPE_DECL)
t = TREE_TYPE (t);
gcc_assert (TYPE_P (t));
return t;
}
/* Return a private global string literal VAR_DECL, whose contents are the
LEN bytes at CONTENTS. */
static tree
build_string_variable (location_t loc, const char *name_seed,
const char *contents, size_t len)
{
tree decl;
decl = build_decl (loc, VAR_DECL, create_tmp_var_name (name_seed),
string_type_node);
TREE_PUBLIC (decl) = false;
TREE_STATIC (decl) = true;
TREE_USED (decl) = true;
DECL_INITIAL (decl) = /* XXX: off-by-one? */
build_string_literal (len + 1, contents);
DECL_ARTIFICIAL (decl) = true;
return decl;
}
/* Return a VAR_DECL for a string variable containing the contents of FILE,
which is looked for in each of the directories listed in SEARCH_PATH. If
FILE could not be found, return NULL_TREE. */
static tree
build_variable_from_file_contents (location_t loc,
const char *name_seed,
const char *file,
const_tree search_path)
{
gcc_assert (search_path != NULL_TREE
&& TREE_CODE (search_path) == TREE_LIST);
int err, dir_fd;
struct stat st;
const_tree dirs;
tree var = NULL_TREE;
/* Look for FILE in each directory in SEARCH_PATH, and pick the first one
that matches. */
for (err = ENOENT, dir_fd = -1, dirs = search_path;
(err != 0 || err == ENOENT) && dirs != NULL_TREE;
dirs = TREE_CHAIN (dirs))
{
gcc_assert (TREE_VALUE (dirs) != NULL_TREE
&& TREE_CODE (TREE_VALUE (dirs)) == STRING_CST);
dir_fd = open (TREE_STRING_POINTER (TREE_VALUE (dirs)),
O_DIRECTORY | O_RDONLY);
if (dir_fd < 0)
err = ENOENT;
else
{
err = fstatat (dir_fd, file, &st, 0);
if (err != 0)
close (dir_fd);
else
/* Leave DIRS unchanged so it can be referred to in diagnostics
below. */
break;
}
}
if (err != 0 || dir_fd < 0)
error_at (loc, "failed to access %qs: %m", file);
else if (st.st_size == 0)
{
error_at (loc, "source file %qs is empty", file);
close (dir_fd);
}
else
{
if (verbose_output_p)
inform (loc, "found file %qs in %qs",
file, TREE_STRING_POINTER (TREE_VALUE (dirs)));
int fd;
fd = openat (dir_fd, file, O_RDONLY);
close (dir_fd);
if (fd < 0)
error_at (loc, "failed to open %qs: %m", file);
else
{
void *contents;
contents = mmap (NULL, st.st_size, PROT_READ, MAP_SHARED, fd, 0);
if (contents == NULL)
error_at (loc, "failed to map contents of %qs: %m", file);
else
{
var = build_string_variable (loc, name_seed,
(char *) contents, st.st_size);
pushdecl (var);
munmap (contents, st.st_size);
}
close (fd);
}
}
return var;
}
/* Return an expression that, given the OpenCL error code in ERROR_VAR,
returns a string. */
static tree
build_opencl_error_string (tree error_var)
{
static tree clstrerror_fn;
LOOKUP_STARPU_FUNCTION (clstrerror_fn, "starpu_opencl_error_string");
return build_call_expr (clstrerror_fn, 1, error_var);
}
/* Return an error-checking `clSetKernelArg' call for argument ARG, at
index IDX, of KERNEL. */
static tree
build_opencl_set_kernel_arg_call (location_t loc, tree fn,
tree kernel, unsigned int idx,
tree arg)
{
gcc_assert (TREE_CODE (fn) == FUNCTION_DECL
&& TREE_TYPE (kernel) == opencl_kernel_type ());
static tree setkernarg_fn;
LOOKUP_STARPU_FUNCTION (setkernarg_fn, "clSetKernelArg");
tree call = build_call_expr (setkernarg_fn, 4, kernel,
build_int_cst (integer_type_node, idx),
size_in_bytes (TREE_TYPE (arg)),
build_addr (arg, fn));
tree error_var = build_decl (loc, VAR_DECL,
create_tmp_var_name ("setkernelarg_error"),
integer_type_node);
DECL_ARTIFICIAL (error_var) = true;
DECL_CONTEXT (error_var) = fn;
tree assignment = build2 (INIT_EXPR, TREE_TYPE (error_var),
error_var, call);
/* Build `if (ERROR_VAR != 0) error ();'. */
tree cond;
cond = build3 (COND_EXPR, void_type_node,
build2 (NE_EXPR, boolean_type_node,
error_var, integer_zero_node),
build_error_statements (loc, error_var,
build_opencl_error_string,
"failed to set OpenCL kernel "
"argument %d", idx),
NULL_TREE);
tree stmts = NULL_TREE;
append_to_statement_list (assignment, &stmts);
append_to_statement_list (cond, &stmts);
return build4 (TARGET_EXPR, void_type_node, error_var,
stmts, NULL_TREE, NULL_TREE);
}
/* Return the sequence of `clSetKernelArg' calls for KERNEL. */
static tree
build_opencl_set_kernel_arg_calls (location_t loc, tree task_impl,
tree kernel)
{
gcc_assert (task_implementation_p (task_impl));
size_t n;
tree arg, stmts = NULL_TREE;
for (arg = DECL_ARGUMENTS (task_impl), n = 0;
arg != NULL_TREE;
arg = TREE_CHAIN (arg), n++)
{
tree call = build_opencl_set_kernel_arg_call (loc, task_impl,
kernel, n, arg);
append_to_statement_list (call, &stmts);
}
return stmts;
}
/* Define a body for TASK_IMPL that loads OpenCL source from FILE and calls
KERNEL. */
static void
define_opencl_task_implementation (location_t loc, tree task_impl,
const char *file, const_tree kernel,
tree groupsize)
{
gcc_assert (task_implementation_p (task_impl)
&& task_implementation_where (task_impl) == STARPU_OPENCL);
gcc_assert (TREE_CODE (kernel) == STRING_CST);
gcc_assert (INTEGRAL_TYPE_P (TREE_TYPE (groupsize)));
local_define (tree, local_var, (tree type))
{
tree var = build_decl (loc, VAR_DECL,
create_tmp_var_name ("opencl_var"),
type);
DECL_ARTIFICIAL (var) = true;
DECL_CONTEXT (var) = task_impl;
return var;
};
if (!verbose_output_p)
/* No further warnings for this node. */
TREE_NO_WARNING (task_impl) = true;
static tree load_fn, load_kern_fn, enqueue_kern_fn, wid_fn, devid_fn, clfinish_fn,
collect_stats_fn, release_ev_fn;
if (load_fn == NULL_TREE)
{
load_fn =
lookup_name (get_identifier ("starpu_opencl_load_opencl_from_string"));
if (load_fn == NULL_TREE)
{
inform (loc, "no OpenCL support, task implementation %qE "
"not generated", DECL_NAME (task_impl));
return;
}
}
LOOKUP_STARPU_FUNCTION (load_kern_fn, "starpu_opencl_load_kernel");
LOOKUP_STARPU_FUNCTION (wid_fn, "starpu_worker_get_id");
LOOKUP_STARPU_FUNCTION (devid_fn, "starpu_worker_get_devid");
LOOKUP_STARPU_FUNCTION (enqueue_kern_fn, "clEnqueueNDRangeKernel");
LOOKUP_STARPU_FUNCTION (clfinish_fn, "clFinish");
LOOKUP_STARPU_FUNCTION (collect_stats_fn, "starpu_opencl_collect_stats");
LOOKUP_STARPU_FUNCTION (release_ev_fn, "clReleaseEvent");
if (verbose_output_p)
inform (loc, "defining %qE, with OpenCL kernel %qs from file %qs",
DECL_NAME (task_impl), TREE_STRING_POINTER (kernel), file);
tree source_var;
source_var = build_variable_from_file_contents (loc, "opencl_source",
file, opencl_include_dirs);
if (source_var != NULL_TREE)
{
/* Give TASK_IMPL an actual argument list. */
DECL_ARGUMENTS (task_impl) = build_function_arguments (task_impl);
tree prog_var, prog_loaded_var;
/* Global variable to hold the `starpu_opencl_program' object. */
prog_var = build_decl (loc, VAR_DECL,
create_tmp_var_name ("opencl_program"),
opencl_program_type ());
TREE_PUBLIC (prog_var) = false;
TREE_STATIC (prog_var) = true;
TREE_USED (prog_var) = true;
DECL_ARTIFICIAL (prog_var) = true;
pushdecl (prog_var);
/* Global variable indicating whether the program has already been
loaded. */
prog_loaded_var = build_decl (loc, VAR_DECL,
create_tmp_var_name ("opencl_prog_loaded"),
boolean_type_node);
TREE_PUBLIC (prog_loaded_var) = false;
TREE_STATIC (prog_loaded_var) = true;
TREE_USED (prog_loaded_var) = true;
DECL_ARTIFICIAL (prog_loaded_var) = true;
DECL_INITIAL (prog_loaded_var) = build_zero_cst (boolean_type_node);
pushdecl (prog_loaded_var);
/* Build `starpu_opencl_load_opencl_from_string (SOURCE_VAR,
&PROG_VAR, "")'. */
tree load = build_call_expr (load_fn, 3, source_var,
build_addr (prog_var, task_impl),
build_string_literal (1, ""));
tree load_stmts = NULL_TREE;
append_to_statement_list (load, &load_stmts);
append_to_statement_list (build2 (MODIFY_EXPR, boolean_type_node,
prog_loaded_var,
build_int_cst (boolean_type_node, 1)),
&load_stmts);
/* Build `if (!PROG_LOADED_VAR) { ...; PROG_LOADED_VAR = true; }'. */
tree load_cond = build3 (COND_EXPR, void_type_node,
prog_loaded_var,
NULL_TREE,
load_stmts);
/* Local variables. */
tree kernel_var, queue_var, event_var, group_size_var, ngroups_var,
error_var;
kernel_var = local_var (opencl_kernel_type ());
queue_var = local_var (opencl_command_queue_type ());
event_var = local_var (opencl_event_type ());
group_size_var = local_var (size_type_node);
ngroups_var = local_var (size_type_node);
error_var = local_var (integer_type_node);
/* Build `starpu_opencl_load_kernel (...)'.
TODO: Check return value. */
tree devid =
build_call_expr (devid_fn, 1, build_call_expr (wid_fn, 0));
tree load_kern = build_call_expr (load_kern_fn, 5,
build_addr (kernel_var, task_impl),
build_addr (queue_var, task_impl),
build_addr (prog_var, task_impl),
build_string_literal
(TREE_STRING_LENGTH (kernel) + 1,
TREE_STRING_POINTER (kernel)),
devid);
tree enqueue_kern =
build_call_expr (enqueue_kern_fn, 9,
queue_var, kernel_var,
build_int_cst (integer_type_node, 1),
null_pointer_node,
build_addr (group_size_var, task_impl),
build_addr (ngroups_var, task_impl),
integer_zero_node,
null_pointer_node,
build_addr (event_var, task_impl));
tree enqueue_err =
build2 (INIT_EXPR, TREE_TYPE (error_var), error_var, enqueue_kern);
tree enqueue_cond =
build3 (COND_EXPR, void_type_node,
build2 (NE_EXPR, boolean_type_node,
error_var, integer_zero_node),
build_error_statements (loc, error_var,
build_opencl_error_string,
"failed to enqueue kernel"),
NULL_TREE);
tree clfinish =
build_call_expr (clfinish_fn, 1, queue_var);
tree collect_stats =
build_call_expr (collect_stats_fn, 1, event_var);
tree release_ev =
build_call_expr (release_ev_fn, 1, event_var);
tree enqueue_stmts = NULL_TREE;
append_to_statement_list (enqueue_err, &enqueue_stmts);
append_to_statement_list (enqueue_cond, &enqueue_stmts);
/* TODO: Build `clFinish', `clReleaseEvent', & co. */
/* Put it all together. */
tree stmts = NULL_TREE;
append_to_statement_list (load_cond, &stmts);
append_to_statement_list (load_kern, &stmts);
append_to_statement_list (build_opencl_set_kernel_arg_calls (loc,
task_impl,
kernel_var),
&stmts);
/* TODO: Support user-provided values. */
append_to_statement_list (build2 (INIT_EXPR, TREE_TYPE (group_size_var),
group_size_var,
fold_convert (TREE_TYPE (group_size_var),
groupsize)),
&stmts);
append_to_statement_list (build2 (INIT_EXPR, TREE_TYPE (ngroups_var),
ngroups_var,
build_int_cst (TREE_TYPE (ngroups_var),
1)),
&stmts);
append_to_statement_list (build4 (TARGET_EXPR, void_type_node,
error_var, enqueue_stmts,
NULL_TREE, NULL_TREE),
&stmts);
append_to_statement_list (clfinish, &stmts);
append_to_statement_list (collect_stats, &stmts);
append_to_statement_list (release_ev, &stmts);
/* Bind the local vars. */
tree vars = chain_trees (kernel_var, queue_var, event_var,
group_size_var, ngroups_var, NULL_TREE);
tree bind = build3 (BIND_EXPR, void_type_node, vars, stmts,
build_block (vars, NULL_TREE, task_impl, NULL_TREE));
TREE_USED (task_impl) = true;
TREE_STATIC (task_impl) = true;
DECL_EXTERNAL (task_impl) = false;
DECL_ARTIFICIAL (task_impl) = true;
DECL_SAVED_TREE (task_impl) = bind;
DECL_INITIAL (task_impl) = BIND_EXPR_BLOCK (bind);
DECL_RESULT (task_impl) =
build_decl (loc, RESULT_DECL, NULL_TREE, void_type_node);
/* Compile TASK_IMPL. */
rest_of_decl_compilation (task_impl, true, 0);
allocate_struct_function (task_impl, false);
cgraph_finalize_function (task_impl, false);
cgraph_mark_needed_node (cgraph_get_node (task_impl));
/* Generate a wrapper for TASK_IMPL, and possibly the body of its task.
This needs to be done explicitly here, because otherwise
`handle_pre_genericize' would never see TASK_IMPL's task. */
tree task = task_implementation_task (task_impl);
if (!TREE_STATIC (task))
{
declare_codelet (task);
define_task (task);
/* Compile TASK's body. */
rest_of_decl_compilation (task, true, 0);
allocate_struct_function (task, false);
cgraph_finalize_function (task, false);
cgraph_mark_needed_node (cgraph_get_node (task));
}
}
else
DECL_SAVED_TREE (task_impl) = error_mark_node;
return;
}
/* Handle the `opencl' pragma, which defines an OpenCL task
implementation. */
void
handle_pragma_opencl (struct cpp_reader *reader)
{
tree args;
location_t loc;
loc = cpp_peek_token (reader, 0)->src_loc;
if (current_function_decl != NULL_TREE)
{
error_at (loc, "% pragma can only be used "
"at the top-level");
return;
}
args = read_pragma_expressions ("opencl", loc);
if (args == NULL_TREE)
return;
/* TODO: Add "number of groups" arguments. */
if (list_length (args) < 4)
{
error_at (loc, "wrong number of arguments for % pragma");
return;
}
if (task_implementation_p (TREE_VALUE (args)))
{
tree task_impl = TREE_VALUE (args);
if (task_implementation_where (task_impl) == STARPU_OPENCL)
{
args = TREE_CHAIN (args);
if (TREE_CODE (TREE_VALUE (args)) == STRING_CST)
{
tree file = TREE_VALUE (args);
args = TREE_CHAIN (args);
if (TREE_CODE (TREE_VALUE (args)) == STRING_CST)
{
tree kernel = TREE_VALUE (args);
args = TREE_CHAIN (args);
if (TREE_TYPE (TREE_VALUE (args)) != NULL_TREE &&
INTEGRAL_TYPE_P (TREE_TYPE (TREE_VALUE (args))))
{
tree groupsize = TREE_VALUE (args);
if (TREE_CHAIN (args) == NULL_TREE)
define_opencl_task_implementation (loc, task_impl,
TREE_STRING_POINTER (file),
kernel, groupsize);
else
error_at (loc, "junk after % pragma");
}
else
error_at (loc, "% argument must be an integral type");
}
else
error_at (loc, "% argument must be a string constant");
}
else
error_at (loc, "% argument must be a string constant");
}
else
error_at (loc, "%qE is not an OpenCL task implementation",
DECL_NAME (task_impl));
}
else
error_at (loc, "%qE is not a task implementation", TREE_VALUE (args));
}
/* Diagnose use of C types that are either nonexistent or different in
OpenCL. */
void
validate_opencl_argument_type (location_t loc, const_tree type)
{
/* When TYPE is a pointer type, get to the base element type. */
for (; POINTER_TYPE_P (type); type = TREE_TYPE (type));
if (!RECORD_OR_UNION_TYPE_P (type) && !VOID_TYPE_P (type))
{
tree decl = TYPE_NAME (type);
if (DECL_P (decl))
{
static const struct { const char *c; const char *cl; }
type_map[] =
{
/* Scalar types defined in OpenCL 1.2. See
. */
{ "char", "cl_char" },
{ "signed char", "cl_char" },
{ "unsigned char", "cl_uchar" },
{ "uchar", "cl_uchar" },
{ "short int", "cl_short" },
{ "unsigned short", "cl_ushort" },
{ "int", "cl_int" },
{ "unsigned int", "cl_uint" },
{ "uint", "cl_uint" },
{ "long int", "cl_long" },
{ "long unsigned int", "cl_ulong" },
{ "ulong", "cl_ulong" },
{ "float", "cl_float" },
{ "double", "cl_double" },
{ NULL, NULL }
};
const char *c_name = IDENTIFIER_POINTER (DECL_NAME (decl));
const char *cl_name =
({
size_t i;
for (i = 0; type_map[i].c != NULL; i++)
{
if (strcmp (type_map[i].c, c_name) == 0)
break;
}
type_map[i].cl;
});
if (cl_name != NULL)
{
tree cl_type = lookup_name (get_identifier (cl_name));
if (cl_type != NULL_TREE)
{
if (DECL_P (cl_type))
cl_type = TREE_TYPE (cl_type);
if (!lang_hooks.types_compatible_p ((tree) type, cl_type))
{
tree st, sclt;
st = c_common_signed_type ((tree) type);
sclt = c_common_signed_type (cl_type);
if (st == sclt)
warning_at (loc, 0, "C type %qE differs in signedness "
"from the same-named OpenCL type",
DECL_NAME (decl));
else
/* TYPE should be avoided because the it differs from
CL_TYPE, and thus cannot be used safely in
`clSetKernelArg'. */
warning_at (loc, 0, "C type %qE differs from the "
"same-named OpenCL type",
DECL_NAME (decl));
}
}
/* Otherwise we can't conclude. It could be that
wasn't included in the program, for instance. */
}
else
/* Recommend against use of `size_t', etc. */
warning_at (loc, 0, "%qE does not correspond to a known "
"OpenCL type", DECL_NAME (decl));
}
}
}