/* Integrated Register Allocator. Changing code and generating moves. Copyright (C) 2006, 2007, 2008 Free Software Foundation, Inc. Contributed by Vladimir Makarov . This file is part of GCC. GCC is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; either version 3, or (at your option) any later version. GCC is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with GCC; see the file COPYING3. If not see . */ #include "config.h" #include "system.h" #include "coretypes.h" #include "tm.h" #include "regs.h" #include "rtl.h" #include "tm_p.h" #include "target.h" #include "flags.h" #include "obstack.h" #include "bitmap.h" #include "hard-reg-set.h" #include "basic-block.h" #include "expr.h" #include "recog.h" #include "params.h" #include "timevar.h" #include "tree-pass.h" #include "output.h" #include "reload.h" #include "errors.h" #include "df.h" #include "ira-int.h" typedef struct move *move_t; /* The structure represents an allocno move. Both allocnos have the same origional regno but different allocation. */ struct move { /* The allocnos involved in the move. */ ira_allocno_t from, to; /* The next move in the move sequence. */ move_t next; /* Used for finding dependencies. */ bool visited_p; /* The size of the following array. */ int deps_num; /* Moves on which given move depends on. Dependency can be cyclic. It means we need a temporary to generates the moves. Sequence A1->A2, B1->B2 where A1 and B2 are assigned to reg R1 and A2 and B1 are assigned to reg R2 is an example of the cyclic dependencies. */ move_t *deps; /* First insn generated for the move. */ rtx insn; }; /* Array of moves (indexed by BB index) which should be put at the start/end of the corresponding basic blocks. */ static move_t *at_bb_start, *at_bb_end; /* Max regno before renaming some pseudo-registers. For example, the same pseudo-register can be renamed in a loop if its allocation is different outside the loop. */ static int max_regno_before_changing; /* Return new move of allocnos TO and FROM. */ static move_t create_move (ira_allocno_t to, ira_allocno_t from) { move_t move; move = (move_t) ira_allocate (sizeof (struct move)); move->deps = NULL; move->deps_num = 0; move->to = to; move->from = from; move->next = NULL; move->insn = NULL_RTX; move->visited_p = false; return move; } /* Free memory for MOVE and its dependencies. */ static void free_move (move_t move) { if (move->deps != NULL) ira_free (move->deps); ira_free (move); } /* Free memory for list of the moves given by its HEAD. */ static void free_move_list (move_t head) { move_t next; for (; head != NULL; head = next) { next = head->next; free_move (head); } } /* Return TRUE if the the move list LIST1 and LIST2 are equal (two moves are equal if they involve the same allocnos). */ static bool eq_move_lists_p (move_t list1, move_t list2) { for (; list1 != NULL && list2 != NULL; list1 = list1->next, list2 = list2->next) if (list1->from != list2->from || list1->to != list2->to) return false; return list1 == list2; } /* This recursive function changes pseudo-registers in *LOC if it is necessary. The function returns TRUE if a change was done. */ static bool change_regs (rtx *loc) { int i, regno, result = false; const char *fmt; enum rtx_code code; rtx reg; if (*loc == NULL_RTX) return false; code = GET_CODE (*loc); if (code == REG) { regno = REGNO (*loc); if (regno < FIRST_PSEUDO_REGISTER) return false; if (regno >= max_regno_before_changing) /* It is a shared register which was changed already. */ return false; if (ira_curr_regno_allocno_map[regno] == NULL) return false; reg = ALLOCNO_REG (ira_curr_regno_allocno_map[regno]); if (reg == *loc) return false; *loc = reg; return true; } fmt = GET_RTX_FORMAT (code); for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--) { if (fmt[i] == 'e') result = change_regs (&XEXP (*loc, i)) || result; else if (fmt[i] == 'E') { int j; for (j = XVECLEN (*loc, i) - 1; j >= 0; j--) result = change_regs (&XVECEXP (*loc, i, j)) || result; } } return result; } /* Attach MOVE to the edge E. The move is attached to the head of the list if HEAD_P is TRUE. */ static void add_to_edge_list (edge e, move_t move, bool head_p) { move_t last; if (head_p || e->aux == NULL) { move->next = (move_t) e->aux; e->aux = move; } else { for (last = (move_t) e->aux; last->next != NULL; last = last->next) ; last->next = move; move->next = NULL; } } /* Create and return new pseudo-register with the same attributes as ORIGINAL_REG. */ static rtx create_new_reg (rtx original_reg) { rtx new_reg; new_reg = gen_reg_rtx (GET_MODE (original_reg)); ORIGINAL_REGNO (new_reg) = ORIGINAL_REGNO (original_reg); REG_USERVAR_P (new_reg) = REG_USERVAR_P (original_reg); REG_POINTER (new_reg) = REG_POINTER (original_reg); REG_ATTRS (new_reg) = REG_ATTRS (original_reg); if (internal_flag_ira_verbose > 3 && ira_dump_file != NULL) fprintf (ira_dump_file, " Creating newreg=%i from oldreg=%i\n", REGNO (new_reg), REGNO (original_reg)); return new_reg; } /* Return TRUE if loop given by SUBNODE inside the loop given by NODE. */ static bool subloop_tree_node_p (ira_loop_tree_node_t subnode, ira_loop_tree_node_t node) { for (; subnode != NULL; subnode = subnode->parent) if (subnode == node) return true; return false; } /* Set up member `reg' to REG for allocnos which has the same regno as ALLOCNO and which are inside the loop corresponding to ALLOCNO. */ static void set_allocno_reg (ira_allocno_t allocno, rtx reg) { int regno; ira_allocno_t a; ira_loop_tree_node_t node; node = ALLOCNO_LOOP_TREE_NODE (allocno); for (a = ira_regno_allocno_map[ALLOCNO_REGNO (allocno)]; a != NULL; a = ALLOCNO_NEXT_REGNO_ALLOCNO (a)) if (subloop_tree_node_p (ALLOCNO_LOOP_TREE_NODE (a), node)) ALLOCNO_REG (a) = reg; for (a = ALLOCNO_CAP (allocno); a != NULL; a = ALLOCNO_CAP (a)) ALLOCNO_REG (a) = reg; regno = ALLOCNO_REGNO (allocno); for (a = allocno;;) { if (a == NULL || (a = ALLOCNO_CAP (a)) == NULL) { node = node->parent; if (node == NULL) break; a = node->regno_allocno_map[regno]; } if (a == NULL) continue; if (ALLOCNO_CHILD_RENAMED_P (a)) break; ALLOCNO_CHILD_RENAMED_P (a) = true; } } /* Return true if there is an entry to given loop not from its parent (or grandparent) block. For example, it is possible for two adjacent loops inside another loop. */ static bool entered_from_non_parent_p (ira_loop_tree_node_t loop_node) { ira_loop_tree_node_t bb_node, src_loop_node, parent; edge e; edge_iterator ei; for (bb_node = loop_node->children; bb_node != NULL; bb_node = bb_node->next) if (bb_node->bb != NULL) { FOR_EACH_EDGE (e, ei, bb_node->bb->preds) if (e->src != ENTRY_BLOCK_PTR && (src_loop_node = IRA_BB_NODE (e->src)->parent) != loop_node) { for (parent = src_loop_node->parent; parent != NULL; parent = parent->parent) if (parent == loop_node) break; if (parent != NULL) /* That is an exit from a nested loop -- skip it. */ continue; for (parent = loop_node->parent; parent != NULL; parent = parent->parent) if (src_loop_node == parent) break; if (parent == NULL) return true; } } return false; } /* Set up ENTERED_FROM_NON_PARENT_P for each loop region. */ static void setup_entered_from_non_parent_p (void) { unsigned int i; loop_p loop; for (i = 0; VEC_iterate (loop_p, ira_loops.larray, i, loop); i++) if (ira_loop_nodes[i].regno_allocno_map != NULL) ira_loop_nodes[i].entered_from_non_parent_p = entered_from_non_parent_p (&ira_loop_nodes[i]); } /* Return TRUE if move of SRC_ALLOCNO (assigned to hard register) to DEST_ALLOCNO (assigned to memory) can be removed beacuse it does not change value of the destination. One possible reason for this is the situation when SRC_ALLOCNO is not modified in the corresponding loop. */ static bool store_can_be_removed_p (ira_allocno_t src_allocno, ira_allocno_t dest_allocno) { int regno, orig_regno; ira_allocno_t a; ira_loop_tree_node_t node; ira_assert (ALLOCNO_CAP_MEMBER (src_allocno) == NULL && ALLOCNO_CAP_MEMBER (dest_allocno) == NULL); orig_regno = ALLOCNO_REGNO (src_allocno); regno = REGNO (ALLOCNO_REG (dest_allocno)); for (node = ALLOCNO_LOOP_TREE_NODE (src_allocno); node != NULL; node = node->parent) { a = node->regno_allocno_map[orig_regno]; ira_assert (a != NULL); if (REGNO (ALLOCNO_REG (a)) == (unsigned) regno) /* We achieved the destination and everything is ok. */ return true; else if (bitmap_bit_p (node->modified_regnos, orig_regno)) return false; else if (node->entered_from_non_parent_p) /* If there is a path from a destination loop block to the source loop header containing basic blocks of non-parents (grandparents) of the source loop, we should have checked modifications of the pseudo on this path too to decide about possibility to remove the store. It could be done by solving a data-flow problem. Unfortunately such global solution would complicate IR flattening. Therefore we just prohibit removal of the store in such complicated case. */ return false; } gcc_unreachable (); } /* Generate and attach moves to the edge E. This looks at the final regnos of allocnos living on the edge with the same original regno to figure out when moves should be generated. */ static void generate_edge_moves (edge e) { ira_loop_tree_node_t src_loop_node, dest_loop_node; unsigned int regno; bitmap_iterator bi; ira_allocno_t src_allocno, dest_allocno, *src_map, *dest_map; move_t move; src_loop_node = IRA_BB_NODE (e->src)->parent; dest_loop_node = IRA_BB_NODE (e->dest)->parent; e->aux = NULL; if (src_loop_node == dest_loop_node) return; src_map = src_loop_node->regno_allocno_map; dest_map = dest_loop_node->regno_allocno_map; EXECUTE_IF_SET_IN_REG_SET (DF_LR_IN (e->dest), FIRST_PSEUDO_REGISTER, regno, bi) if (bitmap_bit_p (DF_LR_OUT (e->src), regno)) { src_allocno = src_map[regno]; dest_allocno = dest_map[regno]; if (REGNO (ALLOCNO_REG (src_allocno)) == REGNO (ALLOCNO_REG (dest_allocno))) continue; /* Remove unnecessary stores at the region exit. We should do this for readonly memory for sure and this is guaranteed by that we never generate moves on region borders (see checking ira_reg_equiv_invariant_p in function change_loop). */ if (ALLOCNO_HARD_REGNO (dest_allocno) < 0 && ALLOCNO_HARD_REGNO (src_allocno) >= 0 && store_can_be_removed_p (src_allocno, dest_allocno)) { ALLOCNO_MEM_OPTIMIZED_DEST (src_allocno) = dest_allocno; ALLOCNO_MEM_OPTIMIZED_DEST_P (dest_allocno) = true; if (internal_flag_ira_verbose > 3 && ira_dump_file != NULL) fprintf (ira_dump_file, " Remove r%d:a%d->a%d(mem)\n", regno, ALLOCNO_NUM (src_allocno), ALLOCNO_NUM (dest_allocno)); continue; } move = create_move (dest_allocno, src_allocno); add_to_edge_list (e, move, true); } } /* Bitmap of allocnos local for the current loop. */ static bitmap local_allocno_bitmap; /* This bitmap is used to find that we need to generate and to use a new pseudo-register when processing allocnos with the same original regno. */ static bitmap used_regno_bitmap; /* This bitmap contains regnos of allocnos which were renamed locally because the allocnos correspond to disjoint live ranges in loops with a common parent. */ static bitmap renamed_regno_bitmap; /* Change (if necessary) pseudo-registers inside loop given by loop tree node NODE. */ static void change_loop (ira_loop_tree_node_t node) { bitmap_iterator bi; unsigned int i; int regno; bool used_p; ira_allocno_t allocno, parent_allocno, *map; rtx insn, original_reg; enum reg_class cover_class; ira_loop_tree_node_t parent; if (node != ira_loop_tree_root) { if (node->bb != NULL) { FOR_BB_INSNS (node->bb, insn) if (INSN_P (insn) && change_regs (&insn)) { df_insn_rescan (insn); df_notes_rescan (insn); } return; } if (internal_flag_ira_verbose > 3 && ira_dump_file != NULL) fprintf (ira_dump_file, " Changing RTL for loop %d (header bb%d)\n", node->loop->num, node->loop->header->index); parent = ira_curr_loop_tree_node->parent; map = parent->regno_allocno_map; EXECUTE_IF_SET_IN_REG_SET (ira_curr_loop_tree_node->border_allocnos, 0, i, bi) { allocno = ira_allocnos[i]; regno = ALLOCNO_REGNO (allocno); cover_class = ALLOCNO_COVER_CLASS (allocno); parent_allocno = map[regno]; ira_assert (regno < ira_reg_equiv_len); /* We generate the same hard register move because the reload pass can put an allocno into memory in this case we will have live range splitting. If it does not happen such the same hard register moves will be removed. The worst case when the both allocnos are put into memory by the reload is very rare. */ if (parent_allocno != NULL && (ALLOCNO_HARD_REGNO (allocno) == ALLOCNO_HARD_REGNO (parent_allocno)) && (ALLOCNO_HARD_REGNO (allocno) < 0 || (parent->reg_pressure[cover_class] + 1 <= ira_available_class_regs[cover_class]) || TEST_HARD_REG_BIT (ira_prohibited_mode_move_regs [ALLOCNO_MODE (allocno)], ALLOCNO_HARD_REGNO (allocno)) /* don't create copies because reload can spill an allocno set by copy although the allocno will not get memory slot. */ || ira_reg_equiv_invariant_p[regno] || ira_reg_equiv_const[regno] != NULL_RTX)) continue; original_reg = ALLOCNO_REG (allocno); if (parent_allocno == NULL || REGNO (ALLOCNO_REG (parent_allocno)) == REGNO (original_reg)) { if (internal_flag_ira_verbose > 3 && ira_dump_file) fprintf (ira_dump_file, " %i vs parent %i:", ALLOCNO_HARD_REGNO (allocno), ALLOCNO_HARD_REGNO (parent_allocno)); set_allocno_reg (allocno, create_new_reg (original_reg)); } } } /* Rename locals: Local allocnos with same regno in different loops might get the different hard register. So we need to change ALLOCNO_REG. */ bitmap_and_compl (local_allocno_bitmap, ira_curr_loop_tree_node->all_allocnos, ira_curr_loop_tree_node->border_allocnos); EXECUTE_IF_SET_IN_REG_SET (local_allocno_bitmap, 0, i, bi) { allocno = ira_allocnos[i]; regno = ALLOCNO_REGNO (allocno); if (ALLOCNO_CAP_MEMBER (allocno) != NULL) continue; used_p = bitmap_bit_p (used_regno_bitmap, regno); bitmap_set_bit (used_regno_bitmap, regno); ALLOCNO_SOMEWHERE_RENAMED_P (allocno) = true; if (! used_p) continue; bitmap_set_bit (renamed_regno_bitmap, regno); set_allocno_reg (allocno, create_new_reg (ALLOCNO_REG (allocno))); } } /* Process to set up flag somewhere_renamed_p. */ static void set_allocno_somewhere_renamed_p (void) { unsigned int regno; ira_allocno_t allocno; ira_allocno_iterator ai; FOR_EACH_ALLOCNO (allocno, ai) { regno = ALLOCNO_REGNO (allocno); if (bitmap_bit_p (renamed_regno_bitmap, regno) && REGNO (ALLOCNO_REG (allocno)) == regno) ALLOCNO_SOMEWHERE_RENAMED_P (allocno) = true; } } /* Return TRUE if move lists on all edges given in vector VEC are equal. */ static bool eq_edge_move_lists_p (VEC(edge,gc) *vec) { move_t list; int i; list = (move_t) EDGE_I (vec, 0)->aux; for (i = EDGE_COUNT (vec) - 1; i > 0; i--) if (! eq_move_lists_p (list, (move_t) EDGE_I (vec, i)->aux)) return false; return true; } /* Look at all entry edges (if START_P) or exit edges of basic block BB and put move lists at the BB start or end if it is possible. In other words, this decreases code duplication of allocno moves. */ static void unify_moves (basic_block bb, bool start_p) { int i; edge e; move_t list; VEC(edge,gc) *vec; vec = (start_p ? bb->preds : bb->succs); if (EDGE_COUNT (vec) == 0 || ! eq_edge_move_lists_p (vec)) return; e = EDGE_I (vec, 0); list = (move_t) e->aux; if (! start_p && control_flow_insn_p (BB_END (bb))) return; e->aux = NULL; for (i = EDGE_COUNT (vec) - 1; i > 0; i--) { e = EDGE_I (vec, i); free_move_list ((move_t) e->aux); e->aux = NULL; } if (start_p) at_bb_start[bb->index] = list; else at_bb_end[bb->index] = list; } /* Last move (in move sequence being processed) setting up the corresponding hard register. */ static move_t hard_regno_last_set[FIRST_PSEUDO_REGISTER]; /* If the element value is equal to CURR_TICK then the corresponding element in `hard_regno_last_set' is defined and correct. */ static int hard_regno_last_set_check[FIRST_PSEUDO_REGISTER]; /* Last move (in move sequence being processed) setting up the corresponding allocno. */ static move_t *allocno_last_set; /* If the element value is equal to CURR_TICK then the corresponding element in . `allocno_last_set' is defined and correct. */ static int *allocno_last_set_check; /* Definition of vector of moves. */ DEF_VEC_P(move_t); DEF_VEC_ALLOC_P(move_t, heap); /* This vec contains moves sorted topologically (depth-first) on their dependency graph. */ static VEC(move_t,heap) *move_vec; /* The variable value is used to check correctness of values of elements of arrays `hard_regno_last_set' and `allocno_last_set_check'. */ static int curr_tick; /* This recursive function traverses dependencies of MOVE and produces topological sorting (in depth-first order). */ static void traverse_moves (move_t move) { int i; if (move->visited_p) return; move->visited_p = true; for (i = move->deps_num - 1; i >= 0; i--) traverse_moves (move->deps[i]); VEC_safe_push (move_t, heap, move_vec, move); } /* Remove unnecessary moves in the LIST, makes topological sorting, and removes cycles on hard reg dependencies by introducing new allocnos assigned to memory and additional moves. It returns the result move list. */ static move_t modify_move_list (move_t list) { int i, n, nregs, hard_regno; ira_allocno_t to, from, new_allocno; move_t move, new_move, set_move, first, last; if (list == NULL) return NULL; /* Creat move deps. */ curr_tick++; for (move = list; move != NULL; move = move->next) { to = move->to; if ((hard_regno = ALLOCNO_HARD_REGNO (to)) < 0) continue; nregs = hard_regno_nregs[hard_regno][ALLOCNO_MODE (to)]; for (i = 0; i < nregs; i++) { hard_regno_last_set[hard_regno + i] = move; hard_regno_last_set_check[hard_regno + i] = curr_tick; } } for (move = list; move != NULL; move = move->next) { from = move->from; to = move->to; if ((hard_regno = ALLOCNO_HARD_REGNO (from)) >= 0) { nregs = hard_regno_nregs[hard_regno][ALLOCNO_MODE (from)]; for (n = i = 0; i < nregs; i++) if (hard_regno_last_set_check[hard_regno + i] == curr_tick && (ALLOCNO_REGNO (hard_regno_last_set[hard_regno + i]->to) != ALLOCNO_REGNO (from))) n++; move->deps = (move_t *) ira_allocate (n * sizeof (move_t)); for (n = i = 0; i < nregs; i++) if (hard_regno_last_set_check[hard_regno + i] == curr_tick && (ALLOCNO_REGNO (hard_regno_last_set[hard_regno + i]->to) != ALLOCNO_REGNO (from))) move->deps[n++] = hard_regno_last_set[hard_regno + i]; move->deps_num = n; } } /* Toplogical sorting: */ VEC_truncate (move_t, move_vec, 0); for (move = list; move != NULL; move = move->next) traverse_moves (move); last = NULL; for (i = (int) VEC_length (move_t, move_vec) - 1; i >= 0; i--) { move = VEC_index (move_t, move_vec, i); move->next = NULL; if (last != NULL) last->next = move; last = move; } first = VEC_last (move_t, move_vec); /* Removing cycles: */ curr_tick++; VEC_truncate (move_t, move_vec, 0); for (move = first; move != NULL; move = move->next) { from = move->from; to = move->to; if ((hard_regno = ALLOCNO_HARD_REGNO (from)) >= 0) { nregs = hard_regno_nregs[hard_regno][ALLOCNO_MODE (from)]; for (i = 0; i < nregs; i++) if (hard_regno_last_set_check[hard_regno + i] == curr_tick && ALLOCNO_HARD_REGNO (hard_regno_last_set[hard_regno + i]->to) >= 0) { set_move = hard_regno_last_set[hard_regno + i]; /* It does not matter what loop_tree_node (of TO or FROM) to use for the new allocno because of subsequent IRA internal representation flattening. */ new_allocno = ira_create_allocno (ALLOCNO_REGNO (set_move->to), false, ALLOCNO_LOOP_TREE_NODE (set_move->to)); ALLOCNO_MODE (new_allocno) = ALLOCNO_MODE (set_move->to); ira_set_allocno_cover_class (new_allocno, ALLOCNO_COVER_CLASS (set_move->to)); ALLOCNO_ASSIGNED_P (new_allocno) = true; ALLOCNO_HARD_REGNO (new_allocno) = -1; ALLOCNO_REG (new_allocno) = create_new_reg (ALLOCNO_REG (set_move->to)); ALLOCNO_CONFLICT_ID (new_allocno) = ALLOCNO_NUM (new_allocno); /* Make it possibly conflicting with all earlier created allocnos. Cases where temporary allocnos created to remove the cycles are quite rare. */ ALLOCNO_MIN (new_allocno) = 0; ALLOCNO_MAX (new_allocno) = ira_allocnos_num - 1; new_move = create_move (set_move->to, new_allocno); set_move->to = new_allocno; VEC_safe_push (move_t, heap, move_vec, new_move); ira_move_loops_num++; if (internal_flag_ira_verbose > 2 && ira_dump_file != NULL) fprintf (ira_dump_file, " Creating temporary allocno a%dr%d\n", ALLOCNO_NUM (new_allocno), REGNO (ALLOCNO_REG (new_allocno))); } } if ((hard_regno = ALLOCNO_HARD_REGNO (to)) < 0) continue; nregs = hard_regno_nregs[hard_regno][ALLOCNO_MODE (to)]; for (i = 0; i < nregs; i++) { hard_regno_last_set[hard_regno + i] = move; hard_regno_last_set_check[hard_regno + i] = curr_tick; } } for (i = (int) VEC_length (move_t, move_vec) - 1; i >= 0; i--) { move = VEC_index (move_t, move_vec, i); move->next = NULL; last->next = move; last = move; } return first; } /* Generate RTX move insns from the move list LIST. This updates allocation cost using move execution frequency FREQ. */ static rtx emit_move_list (move_t list, int freq) { int cost; rtx result, insn; enum machine_mode mode; enum reg_class cover_class; start_sequence (); for (; list != NULL; list = list->next) { start_sequence (); emit_move_insn (ALLOCNO_REG (list->to), ALLOCNO_REG (list->from)); list->insn = get_insns (); end_sequence (); /* The reload needs to have set up insn codes. If the reload sets up insn codes by itself, it may fail because insns will have hard registers instead of pseudos and there may be no machine insn with given hard registers. */ for (insn = list->insn; insn != NULL_RTX; insn = NEXT_INSN (insn)) recog_memoized (insn); emit_insn (list->insn); mode = ALLOCNO_MODE (list->to); cover_class = ALLOCNO_COVER_CLASS (list->to); cost = 0; if (ALLOCNO_HARD_REGNO (list->to) < 0) { if (ALLOCNO_HARD_REGNO (list->from) >= 0) { cost = ira_memory_move_cost[mode][cover_class][0] * freq; ira_store_cost += cost; } } else if (ALLOCNO_HARD_REGNO (list->from) < 0) { if (ALLOCNO_HARD_REGNO (list->to) >= 0) { cost = ira_memory_move_cost[mode][cover_class][0] * freq; ira_load_cost += cost; } } else { cost = ira_register_move_cost[mode][cover_class][cover_class] * freq; ira_shuffle_cost += cost; } ira_overall_cost += cost; } result = get_insns (); end_sequence (); return result; } /* Generate RTX move insns from move lists attached to basic blocks and edges. */ static void emit_moves (void) { basic_block bb; edge_iterator ei; edge e; rtx insns, tmp; FOR_EACH_BB (bb) { if (at_bb_start[bb->index] != NULL) { at_bb_start[bb->index] = modify_move_list (at_bb_start[bb->index]); insns = emit_move_list (at_bb_start[bb->index], REG_FREQ_FROM_BB (bb)); tmp = BB_HEAD (bb); if (LABEL_P (tmp)) tmp = NEXT_INSN (tmp); if (NOTE_INSN_BASIC_BLOCK_P (tmp)) tmp = NEXT_INSN (tmp); if (tmp == BB_HEAD (bb)) emit_insn_before (insns, tmp); else if (tmp != NULL_RTX) emit_insn_after (insns, PREV_INSN (tmp)); else emit_insn_after (insns, get_last_insn ()); } if (at_bb_end[bb->index] != NULL) { at_bb_end[bb->index] = modify_move_list (at_bb_end[bb->index]); insns = emit_move_list (at_bb_end[bb->index], REG_FREQ_FROM_BB (bb)); ira_assert (! control_flow_insn_p (BB_END (bb))); emit_insn_after (insns, BB_END (bb)); } FOR_EACH_EDGE (e, ei, bb->succs) { if (e->aux == NULL) continue; ira_assert ((e->flags & EDGE_ABNORMAL) == 0 || ! EDGE_CRITICAL_P (e)); e->aux = modify_move_list ((move_t) e->aux); insert_insn_on_edge (emit_move_list ((move_t) e->aux, REG_FREQ_FROM_EDGE_FREQ (EDGE_FREQUENCY (e))), e); if (e->src->next_bb != e->dest) ira_additional_jumps_num++; } } } /* Update costs of A and corresponding allocnos on upper levels on the loop tree from reading (if READ_P) or writing A on an execution path with FREQ. */ static void update_costs (ira_allocno_t a, bool read_p, int freq) { ira_loop_tree_node_t parent; for (;;) { ALLOCNO_NREFS (a)++; ALLOCNO_FREQ (a) += freq; ALLOCNO_MEMORY_COST (a) += (ira_memory_move_cost[ALLOCNO_MODE (a)][ALLOCNO_COVER_CLASS (a)] [read_p ? 1 : 0] * freq); if (ALLOCNO_CAP (a) != NULL) a = ALLOCNO_CAP (a); else if ((parent = ALLOCNO_LOOP_TREE_NODE (a)->parent) == NULL || (a = parent->regno_allocno_map[ALLOCNO_REGNO (a)]) == NULL) break; } } /* Process moves from LIST with execution FREQ to add ranges, copies, and modify costs for allocnos involved in the moves. All regnos living through the list is in LIVE_THROUGH, and the loop tree node used to find corresponding allocnos is NODE. */ static void add_range_and_copies_from_move_list (move_t list, ira_loop_tree_node_t node, bitmap live_through, int freq) { int start, n; unsigned int regno; move_t move; ira_allocno_t to, from, a; ira_copy_t cp; allocno_live_range_t r; bitmap_iterator bi; HARD_REG_SET hard_regs_live; if (list == NULL) return; n = 0; EXECUTE_IF_SET_IN_BITMAP (live_through, FIRST_PSEUDO_REGISTER, regno, bi) n++; REG_SET_TO_HARD_REG_SET (hard_regs_live, live_through); /* This is a trick to guarantee that new ranges is not merged with the old ones. */ ira_max_point++; start = ira_max_point; for (move = list; move != NULL; move = move->next) { from = move->from; to = move->to; if (ALLOCNO_CONFLICT_ALLOCNO_ARRAY (to) == NULL) { if (internal_flag_ira_verbose > 2 && ira_dump_file != NULL) fprintf (ira_dump_file, " Allocate conflicts for a%dr%d\n", ALLOCNO_NUM (to), REGNO (ALLOCNO_REG (to))); ira_allocate_allocno_conflicts (to, n); } bitmap_clear_bit (live_through, ALLOCNO_REGNO (from)); bitmap_clear_bit (live_through, ALLOCNO_REGNO (to)); IOR_HARD_REG_SET (ALLOCNO_CONFLICT_HARD_REGS (from), hard_regs_live); IOR_HARD_REG_SET (ALLOCNO_CONFLICT_HARD_REGS (to), hard_regs_live); IOR_HARD_REG_SET (ALLOCNO_TOTAL_CONFLICT_HARD_REGS (from), hard_regs_live); IOR_HARD_REG_SET (ALLOCNO_TOTAL_CONFLICT_HARD_REGS (to), hard_regs_live); update_costs (from, true, freq); update_costs (to, false, freq); cp = ira_add_allocno_copy (from, to, freq, false, move->insn, NULL); if (internal_flag_ira_verbose > 2 && ira_dump_file != NULL) fprintf (ira_dump_file, " Adding cp%d:a%dr%d-a%dr%d\n", cp->num, ALLOCNO_NUM (cp->first), REGNO (ALLOCNO_REG (cp->first)), ALLOCNO_NUM (cp->second), REGNO (ALLOCNO_REG (cp->second))); r = ALLOCNO_LIVE_RANGES (from); if (r == NULL || r->finish >= 0) { ALLOCNO_LIVE_RANGES (from) = ira_create_allocno_live_range (from, start, ira_max_point, r); if (internal_flag_ira_verbose > 2 && ira_dump_file != NULL) fprintf (ira_dump_file, " Adding range [%d..%d] to allocno a%dr%d\n", start, ira_max_point, ALLOCNO_NUM (from), REGNO (ALLOCNO_REG (from))); } else r->finish = ira_max_point; ira_max_point++; ALLOCNO_LIVE_RANGES (to) = ira_create_allocno_live_range (to, ira_max_point, -1, ALLOCNO_LIVE_RANGES (to)); ira_max_point++; } for (move = list; move != NULL; move = move->next) { r = ALLOCNO_LIVE_RANGES (move->to); if (r->finish < 0) { r->finish = ira_max_point - 1; if (internal_flag_ira_verbose > 2 && ira_dump_file != NULL) fprintf (ira_dump_file, " Adding range [%d..%d] to allocno a%dr%d\n", r->start, r->finish, ALLOCNO_NUM (move->to), REGNO (ALLOCNO_REG (move->to))); } } EXECUTE_IF_SET_IN_BITMAP (live_through, FIRST_PSEUDO_REGISTER, regno, bi) { a = node->regno_allocno_map[regno]; if (ALLOCNO_MEM_OPTIMIZED_DEST (a) == NULL) { ALLOCNO_LIVE_RANGES (a) = ira_create_allocno_live_range (a, start, ira_max_point - 1, ALLOCNO_LIVE_RANGES (a)); if (internal_flag_ira_verbose > 2 && ira_dump_file != NULL) fprintf (ira_dump_file, " Adding range [%d..%d] to live through allocno a%dr%d\n", start, ira_max_point - 1, ALLOCNO_NUM (a), REGNO (ALLOCNO_REG (a))); } } } /* Process all move list to add ranges, conflicts, copies, and modify costs for allocnos involved in the moves. */ static void add_ranges_and_copies (void) { basic_block bb; edge_iterator ei; edge e; ira_loop_tree_node_t node; bitmap live_through; live_through = ira_allocate_bitmap (); FOR_EACH_BB (bb) { /* It does not matter what loop_tree_node (of source or destination block) to use for searching allocnos by their regnos because of subsequent IR flattening. */ node = IRA_BB_NODE (bb)->parent; bitmap_copy (live_through, DF_LR_IN (bb)); add_range_and_copies_from_move_list (at_bb_start[bb->index], node, live_through, REG_FREQ_FROM_BB (bb)); bitmap_copy (live_through, DF_LR_OUT (bb)); add_range_and_copies_from_move_list (at_bb_end[bb->index], node, live_through, REG_FREQ_FROM_BB (bb)); FOR_EACH_EDGE (e, ei, bb->succs) { bitmap_and (live_through, DF_LR_IN (e->dest), DF_LR_OUT (bb)); add_range_and_copies_from_move_list ((move_t) e->aux, node, live_through, REG_FREQ_FROM_EDGE_FREQ (EDGE_FREQUENCY (e))); } } ira_free_bitmap (live_through); } /* The entry function changes code and generates shuffling allocnos on region borders for the regional (LOOPS_P is TRUE in this case) register allocation. */ void ira_emit (bool loops_p) { basic_block bb; edge_iterator ei; edge e; ira_allocno_t a; ira_allocno_iterator ai; FOR_EACH_ALLOCNO (a, ai) ALLOCNO_REG (a) = regno_reg_rtx[ALLOCNO_REGNO (a)]; if (! loops_p) return; at_bb_start = (move_t *) ira_allocate (sizeof (move_t) * last_basic_block); memset (at_bb_start, 0, sizeof (move_t) * last_basic_block); at_bb_end = (move_t *) ira_allocate (sizeof (move_t) * last_basic_block); memset (at_bb_end, 0, sizeof (move_t) * last_basic_block); local_allocno_bitmap = ira_allocate_bitmap (); used_regno_bitmap = ira_allocate_bitmap (); renamed_regno_bitmap = ira_allocate_bitmap (); max_regno_before_changing = max_reg_num (); ira_traverse_loop_tree (true, ira_loop_tree_root, change_loop, NULL); set_allocno_somewhere_renamed_p (); ira_free_bitmap (used_regno_bitmap); ira_free_bitmap (renamed_regno_bitmap); ira_free_bitmap (local_allocno_bitmap); setup_entered_from_non_parent_p (); FOR_EACH_BB (bb) { at_bb_start[bb->index] = NULL; at_bb_end[bb->index] = NULL; FOR_EACH_EDGE (e, ei, bb->succs) if (e->dest != EXIT_BLOCK_PTR) generate_edge_moves (e); } allocno_last_set = (move_t *) ira_allocate (sizeof (move_t) * max_reg_num ()); allocno_last_set_check = (int *) ira_allocate (sizeof (int) * max_reg_num ()); memset (allocno_last_set_check, 0, sizeof (int) * max_reg_num ()); memset (hard_regno_last_set_check, 0, sizeof (hard_regno_last_set_check)); curr_tick = 0; FOR_EACH_BB (bb) unify_moves (bb, true); FOR_EACH_BB (bb) unify_moves (bb, false); move_vec = VEC_alloc (move_t, heap, ira_allocnos_num); emit_moves (); add_ranges_and_copies (); /* Clean up: */ FOR_EACH_BB (bb) { free_move_list (at_bb_start[bb->index]); free_move_list (at_bb_end[bb->index]); FOR_EACH_EDGE (e, ei, bb->succs) { free_move_list ((move_t) e->aux); e->aux = NULL; } } VEC_free (move_t, heap, move_vec); ira_free (allocno_last_set_check); ira_free (allocno_last_set); commit_edge_insertions (); ira_free (at_bb_end); ira_free (at_bb_start); }