/* Translation of ISL AST to Gimple. Copyright (C) 2014-2015 Free Software Foundation, Inc. Contributed by Roman Gareev . This file is part of GCC. GCC is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; either version 3, or (at your option) any later version. GCC is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with GCC; see the file COPYING3. If not see . */ #include "config.h" #ifdef HAVE_isl /* Workaround for GMP 5.1.3 bug, see PR56019. */ #include #include #include #include #include /* Since ISL-0.13, the extern is in val_gmp.h. */ #if !defined(HAVE_ISL_SCHED_CONSTRAINTS_COMPUTE_SCHEDULE) && defined(__cplusplus) extern "C" { #endif #include #if !defined(HAVE_ISL_SCHED_CONSTRAINTS_COMPUTE_SCHEDULE) && defined(__cplusplus) } #endif #endif #include "system.h" #include "coretypes.h" #include "alias.h" #include "backend.h" #include "tree.h" #include "gimple.h" #include "hard-reg-set.h" #include "options.h" #include "fold-const.h" #include "internal-fn.h" #include "gimple-iterator.h" #include "tree-ssa-loop.h" #include "tree-pass.h" #include "cfgloop.h" #include "tree-data-ref.h" #include "sese.h" #include "tree-ssa-loop-manip.h" #include "tree-scalar-evolution.h" #include "gimple-ssa.h" #include "tree-into-ssa.h" #include #ifdef HAVE_isl #include "graphite-poly.h" #include "graphite-isl-ast-to-gimple.h" /* This flag is set when an error occurred during the translation of ISL AST to Gimple. */ static bool graphite_regenerate_error; /* We always try to use signed 128 bit types, but fall back to smaller types in case a platform does not provide types of these sizes. In the future we should use isl to derive the optimal type for each subexpression. */ static int max_mode_int_precision = GET_MODE_PRECISION (mode_for_size (MAX_FIXED_MODE_SIZE, MODE_INT, 0)); static int graphite_expression_type_precision = 128 <= max_mode_int_precision ? 128 : max_mode_int_precision; struct ast_build_info { ast_build_info() : is_parallelizable(false) { }; bool is_parallelizable; }; /* Converts a GMP constant VAL to a tree and returns it. */ static tree gmp_cst_to_tree (tree type, mpz_t val) { tree t = type ? type : integer_type_node; mpz_t tmp; mpz_init (tmp); mpz_set (tmp, val); wide_int wi = wi::from_mpz (t, tmp, true); mpz_clear (tmp); return wide_int_to_tree (t, wi); } /* Verifies properties that GRAPHITE should maintain during translation. */ static inline void graphite_verify (void) { #ifdef ENABLE_CHECKING verify_loop_structure (); verify_loop_closed_ssa (true); #endif } /* IVS_PARAMS maps ISL's scattering and parameter identifiers to corresponding trees. */ typedef std::map ivs_params; /* Free all memory allocated for ISL's identifiers. */ void ivs_params_clear (ivs_params &ip) { std::map::iterator it; for (it = ip.begin (); it != ip.end (); it++) { isl_id_free (it->first); } } static tree gcc_expression_from_isl_expression (tree type, __isl_take isl_ast_expr *, ivs_params &ip); /* Return the tree variable that corresponds to the given isl ast identifier expression (an isl_ast_expr of type isl_ast_expr_id). FIXME: We should replace blind conversation of id's type with derivation of the optimal type when we get the corresponding isl support. Blindly converting type sizes may be problematic when we switch to smaller types. */ static tree gcc_expression_from_isl_ast_expr_id (tree type, __isl_keep isl_ast_expr *expr_id, ivs_params &ip) { gcc_assert (isl_ast_expr_get_type (expr_id) == isl_ast_expr_id); isl_id *tmp_isl_id = isl_ast_expr_get_id (expr_id); std::map::iterator res; res = ip.find (tmp_isl_id); isl_id_free (tmp_isl_id); gcc_assert (res != ip.end () && "Could not map isl_id to tree expression"); isl_ast_expr_free (expr_id); return fold_convert (type, res->second); } /* Converts an isl_ast_expr_int expression E to a GCC expression tree of type TYPE. */ static tree gcc_expression_from_isl_expr_int (tree type, __isl_take isl_ast_expr *expr) { gcc_assert (isl_ast_expr_get_type (expr) == isl_ast_expr_int); isl_val *val = isl_ast_expr_get_val (expr); mpz_t val_mpz_t; mpz_init (val_mpz_t); tree res; if (isl_val_get_num_gmp (val, val_mpz_t) == -1) res = NULL_TREE; else res = gmp_cst_to_tree (type, val_mpz_t); isl_val_free (val); isl_ast_expr_free (expr); mpz_clear (val_mpz_t); return res; } /* Converts a binary isl_ast_expr_op expression E to a GCC expression tree of type TYPE. */ static tree binary_op_to_tree (tree type, __isl_take isl_ast_expr *expr, ivs_params &ip) { isl_ast_expr *arg_expr = isl_ast_expr_get_op_arg (expr, 0); tree tree_lhs_expr = gcc_expression_from_isl_expression (type, arg_expr, ip); arg_expr = isl_ast_expr_get_op_arg (expr, 1); tree tree_rhs_expr = gcc_expression_from_isl_expression (type, arg_expr, ip); enum isl_ast_op_type expr_type = isl_ast_expr_get_op_type (expr); isl_ast_expr_free (expr); switch (expr_type) { case isl_ast_op_add: return fold_build2 (PLUS_EXPR, type, tree_lhs_expr, tree_rhs_expr); case isl_ast_op_sub: return fold_build2 (MINUS_EXPR, type, tree_lhs_expr, tree_rhs_expr); case isl_ast_op_mul: return fold_build2 (MULT_EXPR, type, tree_lhs_expr, tree_rhs_expr); case isl_ast_op_div: return fold_build2 (EXACT_DIV_EXPR, type, tree_lhs_expr, tree_rhs_expr); case isl_ast_op_pdiv_q: return fold_build2 (TRUNC_DIV_EXPR, type, tree_lhs_expr, tree_rhs_expr); case isl_ast_op_pdiv_r: return fold_build2 (TRUNC_MOD_EXPR, type, tree_lhs_expr, tree_rhs_expr); case isl_ast_op_fdiv_q: return fold_build2 (FLOOR_DIV_EXPR, type, tree_lhs_expr, tree_rhs_expr); case isl_ast_op_and: return fold_build2 (TRUTH_ANDIF_EXPR, type, tree_lhs_expr, tree_rhs_expr); case isl_ast_op_or: return fold_build2 (TRUTH_ORIF_EXPR, type, tree_lhs_expr, tree_rhs_expr); case isl_ast_op_eq: return fold_build2 (EQ_EXPR, type, tree_lhs_expr, tree_rhs_expr); case isl_ast_op_le: return fold_build2 (LE_EXPR, type, tree_lhs_expr, tree_rhs_expr); case isl_ast_op_lt: return fold_build2 (LT_EXPR, type, tree_lhs_expr, tree_rhs_expr); case isl_ast_op_ge: return fold_build2 (GE_EXPR, type, tree_lhs_expr, tree_rhs_expr); case isl_ast_op_gt: return fold_build2 (GT_EXPR, type, tree_lhs_expr, tree_rhs_expr); default: gcc_unreachable (); } } /* Converts a ternary isl_ast_expr_op expression E to a GCC expression tree of type TYPE. */ static tree ternary_op_to_tree (tree type, __isl_take isl_ast_expr *expr, ivs_params &ip) { gcc_assert (isl_ast_expr_get_op_type (expr) == isl_ast_op_minus); isl_ast_expr *arg_expr = isl_ast_expr_get_op_arg (expr, 0); tree tree_first_expr = gcc_expression_from_isl_expression (type, arg_expr, ip); arg_expr = isl_ast_expr_get_op_arg (expr, 1); tree tree_second_expr = gcc_expression_from_isl_expression (type, arg_expr, ip); arg_expr = isl_ast_expr_get_op_arg (expr, 2); tree tree_third_expr = gcc_expression_from_isl_expression (type, arg_expr, ip); isl_ast_expr_free (expr); return fold_build3 (COND_EXPR, type, tree_first_expr, tree_second_expr, tree_third_expr); } /* Converts a unary isl_ast_expr_op expression E to a GCC expression tree of type TYPE. */ static tree unary_op_to_tree (tree type, __isl_take isl_ast_expr *expr, ivs_params &ip) { gcc_assert (isl_ast_expr_get_op_type (expr) == isl_ast_op_minus); isl_ast_expr *arg_expr = isl_ast_expr_get_op_arg (expr, 0); tree tree_expr = gcc_expression_from_isl_expression (type, arg_expr, ip); isl_ast_expr_free (expr); return fold_build1 (NEGATE_EXPR, type, tree_expr); } /* Converts an isl_ast_expr_op expression E with unknown number of arguments to a GCC expression tree of type TYPE. */ static tree nary_op_to_tree (tree type, __isl_take isl_ast_expr *expr, ivs_params &ip) { enum tree_code op_code; switch (isl_ast_expr_get_op_type (expr)) { case isl_ast_op_max: op_code = MAX_EXPR; break; case isl_ast_op_min: op_code = MIN_EXPR; break; default: gcc_unreachable (); } isl_ast_expr *arg_expr = isl_ast_expr_get_op_arg (expr, 0); tree res = gcc_expression_from_isl_expression (type, arg_expr, ip); int i; for (i = 1; i < isl_ast_expr_get_op_n_arg (expr); i++) { arg_expr = isl_ast_expr_get_op_arg (expr, i); tree t = gcc_expression_from_isl_expression (type, arg_expr, ip); res = fold_build2 (op_code, type, res, t); } isl_ast_expr_free (expr); return res; } /* Converts an isl_ast_expr_op expression E to a GCC expression tree of type TYPE. */ static tree gcc_expression_from_isl_expr_op (tree type, __isl_take isl_ast_expr *expr, ivs_params &ip) { gcc_assert (isl_ast_expr_get_type (expr) == isl_ast_expr_op); switch (isl_ast_expr_get_op_type (expr)) { /* These isl ast expressions are not supported yet. */ case isl_ast_op_error: case isl_ast_op_call: case isl_ast_op_and_then: case isl_ast_op_or_else: case isl_ast_op_select: gcc_unreachable (); case isl_ast_op_max: case isl_ast_op_min: return nary_op_to_tree (type, expr, ip); case isl_ast_op_add: case isl_ast_op_sub: case isl_ast_op_mul: case isl_ast_op_div: case isl_ast_op_pdiv_q: case isl_ast_op_pdiv_r: case isl_ast_op_fdiv_q: case isl_ast_op_and: case isl_ast_op_or: case isl_ast_op_eq: case isl_ast_op_le: case isl_ast_op_lt: case isl_ast_op_ge: case isl_ast_op_gt: return binary_op_to_tree (type, expr, ip); case isl_ast_op_minus: return unary_op_to_tree (type, expr, ip); case isl_ast_op_cond: return ternary_op_to_tree (type, expr, ip); default: gcc_unreachable (); } return NULL_TREE; } /* Converts an ISL AST expression E back to a GCC expression tree of type TYPE. */ static tree gcc_expression_from_isl_expression (tree type, __isl_take isl_ast_expr *expr, ivs_params &ip) { switch (isl_ast_expr_get_type (expr)) { case isl_ast_expr_id: return gcc_expression_from_isl_ast_expr_id (type, expr, ip); case isl_ast_expr_int: return gcc_expression_from_isl_expr_int (type, expr); case isl_ast_expr_op: return gcc_expression_from_isl_expr_op (type, expr, ip); default: gcc_unreachable (); } return NULL_TREE; } /* Creates a new LOOP corresponding to isl_ast_node_for. Inserts an induction variable for the new LOOP. New LOOP is attached to CFG starting at ENTRY_EDGE. LOOP is inserted into the loop tree and becomes the child loop of the OUTER_LOOP. NEWIVS_INDEX binds ISL's scattering name to the induction variable created for the loop of STMT. The new induction variable is inserted in the NEWIVS vector and is of type TYPE. */ static struct loop * graphite_create_new_loop (edge entry_edge, __isl_keep isl_ast_node *node_for, loop_p outer, tree type, tree lb, tree ub, ivs_params &ip) { isl_ast_expr *for_inc = isl_ast_node_for_get_inc (node_for); tree stride = gcc_expression_from_isl_expression (type, for_inc, ip); tree ivvar = create_tmp_var (type, "graphite_IV"); tree iv, iv_after_increment; loop_p loop = create_empty_loop_on_edge (entry_edge, lb, stride, ub, ivvar, &iv, &iv_after_increment, outer ? outer : entry_edge->src->loop_father); isl_ast_expr *for_iterator = isl_ast_node_for_get_iterator (node_for); isl_id *id = isl_ast_expr_get_id (for_iterator); std::map::iterator res; res = ip.find (id); if (ip.count (id)) isl_id_free (res->first); ip[id] = iv; isl_ast_expr_free (for_iterator); return loop; } static edge translate_isl_ast (loop_p context_loop, __isl_keep isl_ast_node *node, edge next_e, ivs_params &ip); /* Create the loop for a isl_ast_node_for. - NEXT_E is the edge where new generated code should be attached. */ static edge translate_isl_ast_for_loop (loop_p context_loop, __isl_keep isl_ast_node *node_for, edge next_e, tree type, tree lb, tree ub, ivs_params &ip) { gcc_assert (isl_ast_node_get_type (node_for) == isl_ast_node_for); struct loop *loop = graphite_create_new_loop (next_e, node_for, context_loop, type, lb, ub, ip); edge last_e = single_exit (loop); edge to_body = single_succ_edge (loop->header); basic_block after = to_body->dest; /* Create a basic block for loop close phi nodes. */ last_e = single_succ_edge (split_edge (last_e)); /* Translate the body of the loop. */ isl_ast_node *for_body = isl_ast_node_for_get_body (node_for); next_e = translate_isl_ast (loop, for_body, to_body, ip); isl_ast_node_free (for_body); redirect_edge_succ_nodup (next_e, after); set_immediate_dominator (CDI_DOMINATORS, next_e->dest, next_e->src); if (flag_loop_parallelize_all) { isl_id *id = isl_ast_node_get_annotation (node_for); gcc_assert (id); ast_build_info *for_info = (ast_build_info *) isl_id_get_user (id); loop->can_be_parallel = for_info->is_parallelizable; free (for_info); isl_id_free (id); } return last_e; } /* We use this function to get the upper bound because of the form, which is used by isl to represent loops: for (iterator = init; cond; iterator += inc) { ... } The loop condition is an arbitrary expression, which contains the current loop iterator. (e.g. iterator + 3 < B && C > iterator + A) We have to know the upper bound of the iterator to generate a loop in Gimple form. It can be obtained from the special representation of the loop condition, which is generated by isl, if the ast_build_atomic_upper_bound option is set. In this case, isl generates a loop condition that consists of the current loop iterator, + an operator (< or <=) and an expression not involving the iterator, which is processed and returned by this function. (e.g iterator <= upper-bound-expression-without-iterator) */ static __isl_give isl_ast_expr * get_upper_bound (__isl_keep isl_ast_node *node_for) { gcc_assert (isl_ast_node_get_type (node_for) == isl_ast_node_for); isl_ast_expr *for_cond = isl_ast_node_for_get_cond (node_for); gcc_assert (isl_ast_expr_get_type (for_cond) == isl_ast_expr_op); isl_ast_expr *res; switch (isl_ast_expr_get_op_type (for_cond)) { case isl_ast_op_le: res = isl_ast_expr_get_op_arg (for_cond, 1); break; case isl_ast_op_lt: { // (iterator < ub) => (iterator <= ub - 1) isl_val *one = isl_val_int_from_si (isl_ast_expr_get_ctx (for_cond), 1); isl_ast_expr *ub = isl_ast_expr_get_op_arg (for_cond, 1); res = isl_ast_expr_sub (ub, isl_ast_expr_from_val (one)); break; } default: gcc_unreachable (); } isl_ast_expr_free (for_cond); return res; } /* All loops generated by create_empty_loop_on_edge have the form of a post-test loop: do { body of the loop; } while (lower bound < upper bound); We create a new if region protecting the loop to be executed, if the execution count is zero (lower bound > upper bound). */ static edge graphite_create_new_loop_guard (edge entry_edge, __isl_keep isl_ast_node *node_for, tree *type, tree *lb, tree *ub, ivs_params &ip) { gcc_assert (isl_ast_node_get_type (node_for) == isl_ast_node_for); tree cond_expr; edge exit_edge; *type = build_nonstandard_integer_type (graphite_expression_type_precision, 0); isl_ast_expr *for_init = isl_ast_node_for_get_init (node_for); *lb = gcc_expression_from_isl_expression (*type, for_init, ip); isl_ast_expr *upper_bound = get_upper_bound (node_for); *ub = gcc_expression_from_isl_expression (*type, upper_bound, ip); /* When ub is simply a constant or a parameter, use lb <= ub. */ if (TREE_CODE (*ub) == INTEGER_CST || TREE_CODE (*ub) == SSA_NAME) cond_expr = fold_build2 (LE_EXPR, boolean_type_node, *lb, *ub); else { tree one = (POINTER_TYPE_P (*type) ? convert_to_ptrofftype (integer_one_node) : fold_convert (*type, integer_one_node)); /* Adding +1 and using LT_EXPR helps with loop latches that have a loop iteration count of "PARAMETER - 1". For PARAMETER == 0 this becomes 2^k-1 due to integer overflow, and the condition lb <= ub is true, even if we do not want this. However lb < ub + 1 is false, as expected. */ tree ub_one = fold_build2 (POINTER_TYPE_P (*type) ? POINTER_PLUS_EXPR : PLUS_EXPR, *type, *ub, one); cond_expr = fold_build2 (LT_EXPR, boolean_type_node, *lb, ub_one); } exit_edge = create_empty_if_region_on_edge (entry_edge, cond_expr); return exit_edge; } /* Translates an isl_ast_node_for to Gimple. */ static edge translate_isl_ast_node_for (loop_p context_loop, __isl_keep isl_ast_node *node, edge next_e, ivs_params &ip) { gcc_assert (isl_ast_node_get_type (node) == isl_ast_node_for); tree type, lb, ub; edge last_e = graphite_create_new_loop_guard (next_e, node, &type, &lb, &ub, ip); edge true_e = get_true_edge_from_guard_bb (next_e->dest); translate_isl_ast_for_loop (context_loop, node, true_e, type, lb, ub, ip); return last_e; } /* Inserts in iv_map a tuple (OLD_LOOP->num, NEW_NAME) for the induction variables of the loops around GBB in SESE. FIXME: Instead of using a vec that maps each loop id to a possible chrec, we could consider using a map that maps loop ids to the corresponding tree expressions. */ static void build_iv_mapping (vec iv_map, gimple_bb_p gbb, __isl_keep isl_ast_expr *user_expr, ivs_params &ip, sese region) { gcc_assert (isl_ast_expr_get_type (user_expr) == isl_ast_expr_op && isl_ast_expr_get_op_type (user_expr) == isl_ast_op_call); int i; isl_ast_expr *arg_expr; for (i = 1; i < isl_ast_expr_get_op_n_arg (user_expr); i++) { arg_expr = isl_ast_expr_get_op_arg (user_expr, i); tree type = build_nonstandard_integer_type (graphite_expression_type_precision, 0); tree t = gcc_expression_from_isl_expression (type, arg_expr, ip); loop_p old_loop = gbb_loop_at_index (gbb, region, i - 1); iv_map[old_loop->num] = t; } } /* Translates an isl_ast_node_user to Gimple. FIXME: We should remove iv_map.create (loop->num + 1), if it is possible. */ static edge translate_isl_ast_node_user (__isl_keep isl_ast_node *node, edge next_e, ivs_params &ip) { gcc_assert (isl_ast_node_get_type (node) == isl_ast_node_user); isl_ast_expr *user_expr = isl_ast_node_user_get_expr (node); isl_ast_expr *name_expr = isl_ast_expr_get_op_arg (user_expr, 0); gcc_assert (isl_ast_expr_get_type (name_expr) == isl_ast_expr_id); isl_id *name_id = isl_ast_expr_get_id (name_expr); poly_bb_p pbb = (poly_bb_p) isl_id_get_user (name_id); gcc_assert (pbb); gimple_bb_p gbb = PBB_BLACK_BOX (pbb); vec iv_map; isl_ast_expr_free (name_expr); isl_id_free (name_id); gcc_assert (GBB_BB (gbb) != ENTRY_BLOCK_PTR_FOR_FN (cfun) && "The entry block should not even appear within a scop"); int nb_loops = number_of_loops (cfun); iv_map.create (nb_loops); iv_map.safe_grow_cleared (nb_loops); build_iv_mapping (iv_map, gbb, user_expr, ip, SCOP_REGION (pbb->scop)); isl_ast_expr_free (user_expr); next_e = copy_bb_and_scalar_dependences (GBB_BB (gbb), SCOP_REGION (pbb->scop), next_e, iv_map, &graphite_regenerate_error); iv_map.release (); mark_virtual_operands_for_renaming (cfun); update_ssa (TODO_update_ssa); return next_e; } /* Translates an isl_ast_node_block to Gimple. */ static edge translate_isl_ast_node_block (loop_p context_loop, __isl_keep isl_ast_node *node, edge next_e, ivs_params &ip) { gcc_assert (isl_ast_node_get_type (node) == isl_ast_node_block); isl_ast_node_list *node_list = isl_ast_node_block_get_children (node); int i; for (i = 0; i < isl_ast_node_list_n_ast_node (node_list); i++) { isl_ast_node *tmp_node = isl_ast_node_list_get_ast_node (node_list, i); next_e = translate_isl_ast (context_loop, tmp_node, next_e, ip); isl_ast_node_free (tmp_node); } isl_ast_node_list_free (node_list); return next_e; } /* Creates a new if region corresponding to ISL's cond. */ static edge graphite_create_new_guard (edge entry_edge, __isl_take isl_ast_expr *if_cond, ivs_params &ip) { tree type = build_nonstandard_integer_type (graphite_expression_type_precision, 0); tree cond_expr = gcc_expression_from_isl_expression (type, if_cond, ip); edge exit_edge = create_empty_if_region_on_edge (entry_edge, cond_expr); return exit_edge; } /* Translates an isl_ast_node_if to Gimple. */ static edge translate_isl_ast_node_if (loop_p context_loop, __isl_keep isl_ast_node *node, edge next_e, ivs_params &ip) { gcc_assert (isl_ast_node_get_type (node) == isl_ast_node_if); isl_ast_expr *if_cond = isl_ast_node_if_get_cond (node); edge last_e = graphite_create_new_guard (next_e, if_cond, ip); edge true_e = get_true_edge_from_guard_bb (next_e->dest); isl_ast_node *then_node = isl_ast_node_if_get_then (node); translate_isl_ast (context_loop, then_node, true_e, ip); isl_ast_node_free (then_node); edge false_e = get_false_edge_from_guard_bb (next_e->dest); isl_ast_node *else_node = isl_ast_node_if_get_else (node); if (isl_ast_node_get_type (else_node) != isl_ast_node_error) translate_isl_ast (context_loop, else_node, false_e, ip); isl_ast_node_free (else_node); return last_e; } /* Translates an ISL AST node NODE to GCC representation in the context of a SESE. */ static edge translate_isl_ast (loop_p context_loop, __isl_keep isl_ast_node *node, edge next_e, ivs_params &ip) { switch (isl_ast_node_get_type (node)) { case isl_ast_node_error: gcc_unreachable (); case isl_ast_node_for: return translate_isl_ast_node_for (context_loop, node, next_e, ip); case isl_ast_node_if: return translate_isl_ast_node_if (context_loop, node, next_e, ip); case isl_ast_node_user: return translate_isl_ast_node_user (node, next_e, ip); case isl_ast_node_block: return translate_isl_ast_node_block (context_loop, node, next_e, ip); default: gcc_unreachable (); } } /* Prints NODE to FILE. */ void print_isl_ast_node (FILE *file, __isl_keep isl_ast_node *node, __isl_keep isl_ctx *ctx) { isl_printer *prn = isl_printer_to_file (ctx, file); prn = isl_printer_set_output_format (prn, ISL_FORMAT_C); prn = isl_printer_print_ast_node (prn, node); prn = isl_printer_print_str (prn, "\n"); isl_printer_free (prn); } /* Add ISL's parameter identifiers and corresponding.trees to ivs_params */ static void add_parameters_to_ivs_params (scop_p scop, ivs_params &ip) { sese region = SCOP_REGION (scop); unsigned nb_parameters = isl_set_dim (scop->context, isl_dim_param); gcc_assert (nb_parameters == SESE_PARAMS (region).length ()); unsigned i; for (i = 0; i < nb_parameters; i++) { isl_id *tmp_id = isl_set_get_dim_id (scop->context, isl_dim_param, i); ip[tmp_id] = SESE_PARAMS (region)[i]; } } /* Generates a build, which specifies the constraints on the parameters. */ static __isl_give isl_ast_build * generate_isl_context (scop_p scop) { isl_set *context_isl = isl_set_params (isl_set_copy (scop->context)); return isl_ast_build_from_context (context_isl); } /* Get the maximal number of schedule dimensions in the scop SCOP. */ static int get_max_schedule_dimensions (scop_p scop) { int i; poly_bb_p pbb; int schedule_dims = 0; FOR_EACH_VEC_ELT (SCOP_BBS (scop), i, pbb) { int pbb_schedule_dims = isl_map_dim (pbb->transformed, isl_dim_out); if (pbb_schedule_dims > schedule_dims) schedule_dims = pbb_schedule_dims; } return schedule_dims; } /* Extend the schedule to NB_SCHEDULE_DIMS schedule dimensions. For schedules with different dimensionality, the isl AST generator can not define an order and will just randomly choose an order. The solution to this problem is to extend all schedules to the maximal number of schedule dimensions (using '0's for the remaining values). */ static __isl_give isl_map * extend_schedule (__isl_take isl_map *schedule, int nb_schedule_dims) { int tmp_dims = isl_map_dim (schedule, isl_dim_out); schedule = isl_map_add_dims (schedule, isl_dim_out, nb_schedule_dims - tmp_dims); isl_val *zero = isl_val_int_from_si (isl_map_get_ctx (schedule), 0); int i; for (i = tmp_dims; i < nb_schedule_dims; i++) { schedule = isl_map_fix_val (schedule, isl_dim_out, i, isl_val_copy (zero)); } isl_val_free (zero); return schedule; } /* Set the separation_class option for unroll and jam. */ static __isl_give isl_union_map * generate_luj_sepclass_opt (scop_p scop, __isl_take isl_union_set *domain, int dim, int cl) { isl_map *map; isl_space *space, *space_sep; isl_ctx *ctx; isl_union_map *mapu; int nsched = get_max_schedule_dimensions (scop); ctx = scop->ctx; space_sep = isl_space_alloc (ctx, 0, 1, 1); space_sep = isl_space_wrap (space_sep); space_sep = isl_space_set_tuple_name (space_sep, isl_dim_set, "separation_class"); space = isl_set_get_space (scop->context); space_sep = isl_space_align_params (space_sep, isl_space_copy(space)); space = isl_space_map_from_domain_and_range (space, space_sep); space = isl_space_add_dims (space,isl_dim_in, nsched); map = isl_map_universe (space); isl_map_fix_si (map,isl_dim_out,0,dim); isl_map_fix_si (map,isl_dim_out,1,cl); mapu = isl_union_map_intersect_domain (isl_union_map_from_map (map), domain); return (mapu); } /* Compute the separation class for loop unroll and jam. */ static __isl_give isl_union_set * generate_luj_sepclass (scop_p scop) { int i; poly_bb_p pbb; isl_union_set *domain_isl; domain_isl = isl_union_set_empty (isl_set_get_space (scop->context)); FOR_EACH_VEC_ELT (SCOP_BBS (scop), i, pbb) { isl_set *bb_domain; isl_set *bb_domain_s; if (pbb->map_sepclass == NULL) continue; if (isl_set_is_empty (pbb->domain)) continue; bb_domain = isl_set_copy (pbb->domain); bb_domain_s = isl_set_apply (bb_domain, pbb->map_sepclass); pbb->map_sepclass = NULL; domain_isl = isl_union_set_union (domain_isl, isl_union_set_from_set (bb_domain_s)); } return domain_isl; } /* Set the AST built options for loop unroll and jam. */ static __isl_give isl_union_map * generate_luj_options (scop_p scop) { isl_union_set *domain_isl; isl_union_map *options_isl_ss; isl_union_map *options_isl = isl_union_map_empty (isl_set_get_space (scop->context)); int dim = get_max_schedule_dimensions (scop) - 1; int dim1 = dim - PARAM_VALUE (PARAM_LOOP_UNROLL_JAM_DEPTH); if (!flag_loop_unroll_jam) return options_isl; domain_isl = generate_luj_sepclass (scop); options_isl_ss = generate_luj_sepclass_opt (scop, domain_isl, dim1, 0); options_isl = isl_union_map_union (options_isl, options_isl_ss); return options_isl; } /* Generates a schedule, which specifies an order used to visit elements in a domain. */ static __isl_give isl_union_map * generate_isl_schedule (scop_p scop) { int nb_schedule_dims = get_max_schedule_dimensions (scop); int i; poly_bb_p pbb; isl_union_map *schedule_isl = isl_union_map_empty (isl_set_get_space (scop->context)); FOR_EACH_VEC_ELT (SCOP_BBS (scop), i, pbb) { /* Dead code elimination: when the domain of a PBB is empty, don't generate code for the PBB. */ if (isl_set_is_empty (pbb->domain)) continue; isl_map *bb_schedule = isl_map_copy (pbb->transformed); bb_schedule = isl_map_intersect_domain (bb_schedule, isl_set_copy (pbb->domain)); bb_schedule = extend_schedule (bb_schedule, nb_schedule_dims); schedule_isl = isl_union_map_union (schedule_isl, isl_union_map_from_map (bb_schedule)); } return schedule_isl; } /* This method is executed before the construction of a for node. */ static __isl_give isl_id * ast_build_before_for (__isl_keep isl_ast_build *build, void *user) { isl_union_map *dependences = (isl_union_map *) user; ast_build_info *for_info = XNEW (struct ast_build_info); isl_union_map *schedule = isl_ast_build_get_schedule (build); isl_space *schedule_space = isl_ast_build_get_schedule_space (build); int dimension = isl_space_dim (schedule_space, isl_dim_out); for_info->is_parallelizable = !carries_deps (schedule, dependences, dimension); isl_union_map_free (schedule); isl_space_free (schedule_space); isl_id *id = isl_id_alloc (isl_ast_build_get_ctx (build), "", for_info); return id; } /* Set the separate option for all dimensions. This helps to reduce control overhead. Set the options for unroll and jam. */ static __isl_give isl_ast_build * set_options (__isl_take isl_ast_build *control, __isl_keep isl_union_map *schedule, __isl_take isl_union_map *opt_luj) { isl_ctx *ctx = isl_union_map_get_ctx (schedule); isl_space *range_space = isl_space_set_alloc (ctx, 0, 1); range_space = isl_space_set_tuple_name (range_space, isl_dim_set, "separate"); isl_union_set *range = isl_union_set_from_set (isl_set_universe (range_space)); isl_union_set *domain = isl_union_map_range (isl_union_map_copy (schedule)); domain = isl_union_set_universe (domain); isl_union_map *options = isl_union_map_from_domain_and_range (domain, range); options = isl_union_map_union (options, opt_luj); return isl_ast_build_set_options (control, options); } static __isl_give isl_ast_node * scop_to_isl_ast (scop_p scop, ivs_params &ip) { /* Generate loop upper bounds that consist of the current loop iterator, an operator (< or <=) and an expression not involving the iterator. If this option is not set, then the current loop iterator may appear several times in the upper bound. See the isl manual for more details. */ isl_options_set_ast_build_atomic_upper_bound (scop->ctx, true); add_parameters_to_ivs_params (scop, ip); isl_union_map *options_luj = generate_luj_options (scop); isl_union_map *schedule_isl = generate_isl_schedule (scop); isl_ast_build *context_isl = generate_isl_context (scop); context_isl = set_options (context_isl, schedule_isl, options_luj); isl_union_map *dependences = NULL; if (flag_loop_parallelize_all) { dependences = scop_get_dependences (scop); context_isl = isl_ast_build_set_before_each_for (context_isl, ast_build_before_for, dependences); } isl_ast_node *ast_isl = isl_ast_build_ast_from_schedule (context_isl, schedule_isl); if(dependences) isl_union_map_free (dependences); isl_ast_build_free (context_isl); return ast_isl; } /* GIMPLE Loop Generator: generates loops from STMT in GIMPLE form for the given SCOP. Return true if code generation succeeded. FIXME: This is not yet a full implementation of the code generator with ISL ASTs. Generation of GIMPLE code has to be completed. */ bool graphite_regenerate_ast_isl (scop_p scop) { loop_p context_loop; sese region = SCOP_REGION (scop); ifsese if_region = NULL; isl_ast_node *root_node; ivs_params ip; timevar_push (TV_GRAPHITE_CODE_GEN); graphite_regenerate_error = false; root_node = scop_to_isl_ast (scop, ip); if (dump_file && (dump_flags & TDF_DETAILS)) { fprintf (dump_file, "\nISL AST generated by ISL: \n"); print_isl_ast_node (dump_file, root_node, scop->ctx); fprintf (dump_file, "\n"); } recompute_all_dominators (); graphite_verify (); if_region = move_sese_in_condition (region); sese_insert_phis_for_liveouts (region, if_region->region->exit->src, if_region->false_region->exit, if_region->true_region->exit); recompute_all_dominators (); graphite_verify (); context_loop = SESE_ENTRY (region)->src->loop_father; translate_isl_ast (context_loop, root_node, if_region->true_region->entry, ip); mark_virtual_operands_for_renaming (cfun); update_ssa (TODO_update_ssa); graphite_verify (); scev_reset (); recompute_all_dominators (); graphite_verify (); if (graphite_regenerate_error) set_ifsese_condition (if_region, integer_zero_node); free (if_region->true_region); free (if_region->region); free (if_region); ivs_params_clear (ip); isl_ast_node_free (root_node); timevar_pop (TV_GRAPHITE_CODE_GEN); if (dump_file && (dump_flags & TDF_DETAILS)) { loop_p loop; int num_no_dependency = 0; FOR_EACH_LOOP (loop, 0) if (loop->can_be_parallel) num_no_dependency++; fprintf (dump_file, "\n%d loops carried no dependency.\n", num_no_dependency); } return !graphite_regenerate_error; } #endif