diff options
Diffstat (limited to 'gcc/config/arm/arm.c')
-rw-r--r-- | gcc/config/arm/arm.c | 3432 |
1 files changed, 2997 insertions, 435 deletions
diff --git a/gcc/config/arm/arm.c b/gcc/config/arm/arm.c index 7bf05363b77..3a4acd79846 100644 --- a/gcc/config/arm/arm.c +++ b/gcc/config/arm/arm.c @@ -24,6 +24,8 @@ Boston, MA 02111-1307, USA. */ #include "config.h" #include "system.h" #include "rtl.h" +#include "tree.h" +#include "tm_p.h" #include "regs.h" #include "hard-reg-set.h" #include "real.h" @@ -34,41 +36,69 @@ Boston, MA 02111-1307, USA. */ #include "insn-attr.h" #include "flags.h" #include "reload.h" -#include "tree.h" #include "function.h" #include "expr.h" #include "toplev.h" #include "recog.h" #include "ggc.h" +#include "except.h" #include "tm_p.h" -#ifndef Mmode -#define Mmode enum machine_mode -#endif - -/* Some function declarations. */ -static HOST_WIDE_INT int_log2 PARAMS ((HOST_WIDE_INT)); -static char * output_multi_immediate PARAMS ((rtx *, char *, char *, int, HOST_WIDE_INT)); -static int arm_gen_constant PARAMS ((enum rtx_code, Mmode, HOST_WIDE_INT, rtx, rtx, int, int)); -static int arm_naked_function_p PARAMS ((tree)); -static void init_fpa_table PARAMS ((void)); -static enum machine_mode select_dominance_cc_mode PARAMS ((rtx, rtx, HOST_WIDE_INT)); -static HOST_WIDE_INT add_minipool_constant PARAMS ((rtx, Mmode)); -static void dump_minipool PARAMS ((rtx)); -static rtx find_barrier PARAMS ((rtx, int)); -static void push_minipool_fix PARAMS ((rtx, int, rtx *, Mmode, rtx)); -static void push_minipool_barrier PARAMS ((rtx, int)); -static void note_invalid_constants PARAMS ((rtx, int)); -static char * fp_const_from_val PARAMS ((REAL_VALUE_TYPE *)); -static int eliminate_lr2ip PARAMS ((rtx *)); -static char * shift_op PARAMS ((rtx, HOST_WIDE_INT *)); -static int pattern_really_clobbers_lr PARAMS ((rtx)); -static int function_really_clobbers_lr PARAMS ((rtx)); -static rtx emit_multi_reg_push PARAMS ((int)); -static rtx emit_sfm PARAMS ((int, int)); -static enum arm_cond_code get_arm_condition_code PARAMS ((rtx)); -static int const_ok_for_op PARAMS ((HOST_WIDE_INT, enum rtx_code)); -static void arm_add_gc_roots PARAMS ((void)); +/* Forward definitions of types. */ +typedef struct minipool_node Mnode; +typedef struct minipool_fixup Mfix; + +/* In order to improve the layout of the prototypes below + some short type abbreviations are defined here. */ +#define Hint HOST_WIDE_INT +#define Mmode enum machine_mode +#define Ulong unsigned long + +/* Forward function declarations. */ +static void arm_add_gc_roots PARAMS ((void)); +static int arm_gen_constant PARAMS ((enum rtx_code, Mmode, Hint, rtx, rtx, int, int)); +static int arm_naked_function_p PARAMS ((tree)); +static Ulong bit_count PARAMS ((signed int)); +static int const_ok_for_op PARAMS ((Hint, enum rtx_code)); +static int eliminate_lr2ip PARAMS ((rtx *)); +static rtx emit_multi_reg_push PARAMS ((int)); +static rtx emit_sfm PARAMS ((int, int)); +static char * fp_const_from_val PARAMS ((REAL_VALUE_TYPE *)); +static int function_really_clobbers_lr PARAMS ((rtx)); +static arm_cc get_arm_condition_code PARAMS ((rtx)); +static void init_fpa_table PARAMS ((void)); +static Hint int_log2 PARAMS ((Hint)); +static rtx is_jump_table PARAMS ((rtx)); +static char * output_multi_immediate PARAMS ((rtx *, char *, char *, int, Hint)); +static int pattern_really_clobbers_lr PARAMS ((rtx)); +static void print_multi_reg PARAMS ((FILE *, char *, int, int, int)); +static Mmode select_dominance_cc_mode PARAMS ((rtx, rtx, Hint)); +static char * shift_op PARAMS ((rtx, Hint *)); +static void arm_init_machine_status PARAMS ((struct function *)); +static void arm_mark_machine_status PARAMS ((struct function *)); +static int number_of_first_bit_set PARAMS ((int)); +static void replace_symbols_in_block PARAMS ((tree, rtx, rtx)); +static void thumb_exit PARAMS ((FILE *, int, rtx)); +static void thumb_pushpop PARAMS ((FILE *, int, int)); +static char * thumb_condition_code PARAMS ((rtx, int)); +static rtx is_jump_table PARAMS ((rtx)); +static Hint get_jump_table_size PARAMS ((rtx)); +static Mnode * move_minipool_fix_forward_ref PARAMS ((Mnode *, Mnode *, Hint)); +static Mnode * add_minipool_forward_ref PARAMS ((Mfix *)); +static Mnode * move_minipool_fix_backward_ref PARAMS ((Mnode *, Mnode *, Hint)); +static Mnode * add_minipool_backward_ref PARAMS ((Mfix *)); +static void assign_minipool_offsets PARAMS ((Mfix *)); +static void arm_print_value PARAMS ((FILE *, rtx)); +static void dump_minipool PARAMS ((rtx)); +static int arm_barrier_cost PARAMS ((rtx)); +static Mfix * create_fix_barrier PARAMS ((Mfix *, Hint)); +static void push_minipool_barrier PARAMS ((rtx, Hint)); +static void push_minipool_fix PARAMS ((rtx, Hint, rtx *, Mmode, rtx)); +static void note_invalid_constants PARAMS ((rtx, Hint)); + +#undef Hint +#undef Mmode +#undef Ulong /* The maximum number of insns skipped which will be conditionalised if possible. */ @@ -110,9 +140,10 @@ int arm_structure_size_boundary = DEFAULT_STRUCTURE_SIZE_BOUNDARY; #define FL_LDSCHED (1 << 7) /* Load scheduling necessary */ #define FL_STRONG (1 << 8) /* StrongARM */ -/* The bits in this mask specify which instructions we are allowed to - generate. */ +/* The bits in this mask specify which instructions we are + allowed to generate. */ static int insn_flags = 0; + /* The bits in this mask specify which instruction scheduling options should be used. Note - there is an overlap with the FL_FAST_MULT. For some hardware we want to be able to generate the multiply instructions, but to @@ -158,7 +189,7 @@ int lr_save_eliminated; /* Set to 1 when a return insn is output, this means that the epilogue is not needed. */ -static int return_used_this_function; +int return_used_this_function; /* Set to 1 after arm_reorg has started. Reset to start at the start of the next function. */ @@ -180,8 +211,6 @@ char * arm_condition_codes[] = "hi", "ls", "ge", "lt", "gt", "le", "al", "nv" }; -static enum arm_cond_code get_arm_condition_code (); - #define streq(string1, string2) (strcmp (string1, string2) == 0) /* Initialization code. */ @@ -208,7 +237,7 @@ static struct processors all_cores[] = {"arm620", FL_CO_PROC | FL_MODE26 | FL_MODE32 }, {"arm7", FL_CO_PROC | FL_MODE26 | FL_MODE32 }, /* arm7m doesn't exist on its own, but only with D, (and I), but - those don't alter the code, so arm7m is sometimes used. */ + those don't alter the code, so arm7m is sometimes used. */ {"arm7m", FL_CO_PROC | FL_MODE26 | FL_MODE32 | FL_FAST_MULT }, {"arm7d", FL_CO_PROC | FL_MODE26 | FL_MODE32 }, {"arm7dm", FL_CO_PROC | FL_MODE26 | FL_MODE32 | FL_FAST_MULT }, @@ -267,11 +296,11 @@ struct arm_cpu_select arm_select[] = }; /* Return the number of bits set in value' */ -static unsigned int +static unsigned long bit_count (value) signed int value; { - unsigned int count = 0; + unsigned long count = 0; while (value) { @@ -375,23 +404,22 @@ arm_override_options () switch that require certain abilities from the cpu. */ sought = 0; - if (TARGET_INTERWORK) + if (TARGET_INTERWORK || TARGET_THUMB) { sought |= (FL_THUMB | FL_MODE32); /* Force apcs-32 to be used for interworking. */ target_flags |= ARM_FLAG_APCS_32; - /* There are no ARM processor that supports both APCS-26 and + /* There are no ARM processors that support both APCS-26 and interworking. Therefore we force FL_MODE26 to be removed from insn_flags here (if it was set), so that the search below will always be able to find a compatible processor. */ insn_flags &= ~ FL_MODE26; } - - if (! TARGET_APCS_32) + else if (! TARGET_APCS_32) sought |= FL_MODE26; - + if (sought != 0 && ((sought & insn_flags) != sought)) { /* Try to locate a CPU type that supports all of the abilities @@ -471,6 +499,30 @@ arm_override_options () target_flags &= ~ARM_FLAG_INTERWORK; } + if (TARGET_THUMB && !(insn_flags & FL_THUMB)) + { + warning ("target CPU does not supoport THUMB instructions."); + target_flags &= ~ARM_FLAG_THUMB; + } + + if (TARGET_APCS_FRAME && TARGET_THUMB) + { + /* warning ("ignoring -mapcs-frame because -mthumb was used."); */ + target_flags &= ~ARM_FLAG_APCS_FRAME; + } + + /* TARGET_BACKTRACE calls leaf_function_p, which causes a crash if done + from here where no function is being compiled currently. */ + if ((target_flags & (THUMB_FLAG_LEAF_BACKTRACE | THUMB_FLAG_BACKTRACE)) + && TARGET_ARM) + warning ("enabling backtrace support is only meaningful when compiling for the Thumb."); + + if (TARGET_ARM && TARGET_CALLEE_INTERWORKING) + warning ("enabling callee interworking support is only meaningful when compiling for the Thumb."); + + if (TARGET_ARM && TARGET_CALLER_INTERWORKING) + warning ("enabling caller interworking support is only meaningful when compiling for the Thumb."); + /* If interworking is enabled then APCS-32 must be selected as well. */ if (TARGET_INTERWORK) { @@ -479,7 +531,7 @@ arm_override_options () target_flags |= ARM_FLAG_APCS_32; } - if (TARGET_APCS_STACK && ! TARGET_APCS) + if (TARGET_APCS_STACK && ! TARGET_APCS_FRAME) { warning ("-mapcs-stack-check incompatible with -mno-apcs-frame"); target_flags |= ARM_FLAG_APCS_FRAME; @@ -494,8 +546,13 @@ arm_override_options () if (TARGET_APCS_REENT) warning ("APCS reentrant code not supported. Ignored"); - if (write_symbols != NO_DEBUG && flag_omit_frame_pointer) - warning ("-g with -fomit-frame-pointer may not give sensible debugging"); + /* If this target is normally configured to use APCS frames, warn if they + are turned off and debugging is turned on. */ + if (TARGET_ARM + && write_symbols != NO_DEBUG + && ! TARGET_APCS_FRAME + && (TARGET_DEFAULT & ARM_FLAG_APCS_FRAME)) + warning ("-g with -mno-apcs-frame may not give sensible debugging"); /* If stack checking is disabled, we can use r10 as the PIC register, which keeps r9 available. */ @@ -512,8 +569,8 @@ arm_override_options () arm_ld_sched = (tune_flags & FL_LDSCHED) != 0; arm_is_strong = (tune_flags & FL_STRONG) != 0; - arm_is_6_or_7 = ((tune_flags & (FL_MODE26 | FL_MODE32)) - && !(tune_flags & FL_ARCH4)) != 0; + arm_is_6_or_7 = (((tune_flags & (FL_MODE26 | FL_MODE32)) + && !(tune_flags & FL_ARCH4))) != 0; /* Default value for floating point code... if no co-processor bus, then schedule for emulated floating point. Otherwise, @@ -574,7 +631,13 @@ arm_override_options () else arm_pic_register = pic_register; } - + + if (TARGET_THUMB && flag_schedule_insns) + { + /* Don't warn since it's on by default in -O2. */ + flag_schedule_insns = 0; + } + /* If optimizing for space, don't synthesize constants. For processors with load scheduling, it never costs more than 2 cycles to load a constant, and the load scheduler may well reduce that to 1. */ @@ -602,7 +665,6 @@ arm_add_gc_roots () ggc_add_rtx_root (&arm_target_insn, 1); /* Not sure this is really a root */ /* XXX: What about the minipool tables? */ } - /* Return 1 if it is possible to return using a single instruction. */ int @@ -611,11 +673,16 @@ use_return_insn (iscond) { int regno; - if (!reload_completed + /* Never use a return instruction before reload has run. */ + if (! reload_completed + /* Or if the function is variadic. */ || current_function_pretend_args_size || current_function_anonymous_args + /* Of if the function calls __builtin_eh_return () */ + || cfun->machine->eh_epilogue_sp_ofs != NULL + /* Or if there is no frame pointer and there is a stack adjustment. */ || ((get_frame_size () + current_function_outgoing_args_size != 0) - && !(TARGET_APCS && frame_pointer_needed))) + && ! frame_pointer_needed)) return 0; /* Can't be done if interworking with Thumb, and any registers have been @@ -623,10 +690,11 @@ use_return_insn (iscond) if they aren't taken and registers have been stacked. */ if (iscond && arm_is_strong && frame_pointer_needed) return 0; + if ((iscond && arm_is_strong) || TARGET_INTERWORK) { - for (regno = 0; regno < 16; regno++) + for (regno = 0; regno <= LAST_ARM_REGNUM; regno++) if (regs_ever_live[regno] && ! call_used_regs[regno]) return 0; @@ -636,9 +704,10 @@ use_return_insn (iscond) /* Can't be done if any of the FPU regs are pushed, since this also requires an insn. */ - for (regno = 16; regno < 24; regno++) - if (regs_ever_live[regno] && ! call_used_regs[regno]) - return 0; + if (TARGET_HARD_FLOAT) + for (regno = FIRST_ARM_FP_REGNUM; regno <= LAST_ARM_FP_REGNUM; regno++) + if (regs_ever_live[regno] && ! call_used_regs[regno]) + return 0; /* If a function is naked, don't use the "return" insn. */ if (arm_naked_function_p (current_function_decl)) @@ -657,10 +726,10 @@ const_ok_for_arm (i) /* For machines with >32 bit HOST_WIDE_INT, the bits above bit 31 must be all zero, or all one. */ - if ((i & ~(unsigned HOST_WIDE_INT) 0xffffffffUL) != 0 - && ((i & ~(unsigned HOST_WIDE_INT) 0xffffffffUL) + if ((i & ~(unsigned HOST_WIDE_INT) 0xffffffff) != 0 + && ((i & ~(unsigned HOST_WIDE_INT) 0xffffffff) != ((~(unsigned HOST_WIDE_INT) 0) - & ~(unsigned HOST_WIDE_INT) 0xffffffffUL))) + & ~(unsigned HOST_WIDE_INT) 0xffffffff))) return FALSE; /* Fast return for 0 and powers of 2 */ @@ -669,11 +738,11 @@ const_ok_for_arm (i) do { - if ((i & mask & (unsigned HOST_WIDE_INT) 0xffffffffUL) == 0) + if ((i & mask & (unsigned HOST_WIDE_INT) 0xffffffff) == 0) return TRUE; mask = - (mask << 2) | ((mask & (unsigned HOST_WIDE_INT) 0xffffffffUL) - >> (32 - 2)) | ~((unsigned HOST_WIDE_INT) 0xffffffffUL); + (mask << 2) | ((mask & (unsigned HOST_WIDE_INT) 0xffffffff) + >> (32 - 2)) | ~((unsigned HOST_WIDE_INT) 0xffffffff); } while (mask != ~(unsigned HOST_WIDE_INT) 0xFF); return FALSE; @@ -758,7 +827,7 @@ arm_split_constant (code, mode, val, target, source, subtargets) have subtraction of a constant. */ if (code == MINUS) emit_insn (gen_rtx_SET (VOIDmode, target, - gen_rtx (code, mode, temp, source))); + gen_rtx_MINUS (mode, temp, source))); else emit_insn (gen_rtx_SET (VOIDmode, target, gen_rtx (code, mode, source, temp))); @@ -772,7 +841,7 @@ arm_split_constant (code, mode, val, target, source, subtargets) /* As above, but extra parameter GENERATE which, if clear, suppresses RTL generation. */ -int +static int arm_gen_constant (code, mode, val, target, source, subtargets, generate) enum rtx_code code; enum machine_mode mode; @@ -794,9 +863,9 @@ arm_gen_constant (code, mode, val, target, source, subtargets, generate) int set_zero_bit_copies = 0; int insns = 0; unsigned HOST_WIDE_INT temp1, temp2; - unsigned HOST_WIDE_INT remainder = val & 0xffffffffUL; + unsigned HOST_WIDE_INT remainder = val & (unsigned HOST_WIDE_INT)0xffffffff; - /* find out which operations are safe for a given CODE. Also do a quick + /* Find out which operations are safe for a given CODE. Also do a quick check for degenerate cases; these can occur when DImode operations are split. */ switch (code) @@ -813,7 +882,7 @@ arm_gen_constant (code, mode, val, target, source, subtargets, generate) break; case IOR: - if (remainder == 0xffffffffUL) + if (remainder == (unsigned HOST_WIDE_INT)0xffffffff) { if (generate) emit_insn (gen_rtx_SET (VOIDmode, target, @@ -837,7 +906,7 @@ arm_gen_constant (code, mode, val, target, source, subtargets, generate) emit_insn (gen_rtx_SET (VOIDmode, target, const0_rtx)); return 1; } - if (remainder == 0xffffffffUL) + if (remainder == (unsigned HOST_WIDE_INT)0xffffffff) { if (reload_completed && rtx_equal_p (target, source)) return 0; @@ -857,7 +926,7 @@ arm_gen_constant (code, mode, val, target, source, subtargets, generate) emit_insn (gen_rtx_SET (VOIDmode, target, source)); return 1; } - if (remainder == 0xffffffffUL) + if (remainder == (unsigned HOST_WIDE_INT)0xffffffff) { if (generate) emit_insn (gen_rtx_SET (VOIDmode, target, @@ -985,15 +1054,16 @@ arm_gen_constant (code, mode, val, target, source, subtargets, generate) word. We only look for the simplest cases, to do more would cost too much. Be careful, however, not to generate this when the alternative would take fewer insns. */ - if (val & 0xffff0000UL) + if (val & (unsigned HOST_WIDE_INT)0xffff0000) { - temp1 = remainder & 0xffff0000UL; + temp1 = remainder & (unsigned HOST_WIDE_INT)0xffff0000; temp2 = remainder & 0x0000ffff; /* Overlaps outside this range are best done using other methods. */ for (i = 9; i < 24; i++) { - if ((((temp2 | (temp2 << i)) & 0xffffffffUL) == remainder) + if ((((temp2 | (temp2 << i)) + & (unsigned HOST_WIDE_INT)0xffffffff) == remainder) && ! const_ok_for_arm (temp2)) { rtx new_src = (subtargets @@ -1131,11 +1201,11 @@ arm_gen_constant (code, mode, val, target, source, subtargets, generate) /* See if two shifts will do 2 or more insn's worth of work. */ if (clear_sign_bit_copies >= 16 && clear_sign_bit_copies < 24) { - HOST_WIDE_INT shift_mask = ((0xffffffffUL + HOST_WIDE_INT shift_mask = ((((unsigned HOST_WIDE_INT)0xffffffff) << (32 - clear_sign_bit_copies)) - & 0xffffffffUL); + & (unsigned HOST_WIDE_INT)0xffffffff); - if ((remainder | shift_mask) != 0xffffffffUL) + if ((remainder | shift_mask) != (unsigned HOST_WIDE_INT)0xffffffff) { if (generate) { @@ -1168,7 +1238,7 @@ arm_gen_constant (code, mode, val, target, source, subtargets, generate) { HOST_WIDE_INT shift_mask = (1 << clear_zero_bit_copies) - 1; - if ((remainder | shift_mask) != 0xffffffffUL) + if ((remainder | shift_mask) != (unsigned HOST_WIDE_INT)0xffffffff) { if (generate) { @@ -1210,9 +1280,9 @@ arm_gen_constant (code, mode, val, target, source, subtargets, generate) num_bits_set++; if (code == AND || (can_invert && num_bits_set > 16)) - remainder = (~remainder) & 0xffffffffUL; + remainder = (~remainder) & (unsigned HOST_WIDE_INT)0xffffffff; else if (code == PLUS && num_bits_set > 16) - remainder = (-remainder) & 0xffffffffUL; + remainder = (-remainder) & (unsigned HOST_WIDE_INT)0xffffffff; else { can_invert = 0; @@ -1392,11 +1462,15 @@ arm_return_in_memory (type) if (! AGGREGATE_TYPE_P (type)) /* All simple types are returned in registers. */ return 0; - + + /* For the arm-wince targets we choose to be compitable with Microsoft's + ARM and Thumb compilers, which always return aggregates in memory. */ +#ifndef ARM_WINCE + if (int_size_in_bytes (type) > 4) /* All structures/unions bigger than one word are returned in memory. */ return 1; - + if (TREE_CODE (type) == RECORD_TYPE) { tree field; @@ -1417,13 +1491,17 @@ arm_return_in_memory (type) if (field == NULL) return 0; /* An empty structure. Allowed by an extension to ANSI C. */ - /* Check that the first field is valid for returning in a register... */ + /* Check that the first field is valid for returning in a register. */ + + /* ... Floats are not allowed */ if (FLOAT_TYPE_P (TREE_TYPE (field))) return 1; + /* ... Aggregates that are not themselves valid for returning in + a register are not allowed. */ if (RETURN_IN_MEMORY (TREE_TYPE (field))) return 1; - + /* Now check the remaining fields, if any. Only bitfields are allowed, since they are not addressable. */ for (field = TREE_CHAIN (field); @@ -1462,8 +1540,9 @@ arm_return_in_memory (type) return 0; } +#endif /* not ARM_WINCE */ - /* Put other aggregates in memory. */ + /* Return all other types in memory. */ return 1; } @@ -1622,20 +1701,6 @@ arm_comp_type_attributes (type1, type2) return 1; } -/* Check the ARM specific attributes on the given function decl. - If any of them would prevent the function from being inlined, - return a tesxtual description of why not. Otherwise return NULL. */ -const char * -arm_function_attribute_inlineable_p (fndecl) - tree fndecl; -{ - if (lookup_attribute ("naked", DECL_MACHINE_ATTRIBUTES (fndecl))) - return "naked functions cannot be inlined"; - - /* Allow functions with short_call and long_call attributes to be inlined. */ - return NULL; -} - /* Encode long_call or short_call attribute by prefixing symbol name in DECL with a special character FLAG. */ void @@ -1771,7 +1836,8 @@ int legitimate_pic_operand_p (x) rtx x; { - if (CONSTANT_P (x) && flag_pic + if (CONSTANT_P (x) + && flag_pic && (GET_CODE (x) == SYMBOL_REF || (GET_CODE (x) == CONST && GET_CODE (XEXP (x, 0)) == PLUS @@ -1884,15 +1950,15 @@ legitimize_pic_address (orig, mode, reg) current_function_uses_pic_offset_table = 1; if (NEED_GOT_RELOC) - { - rtx pic_ref, address = gen_reg_rtx (Pmode); - - emit_insn (gen_pic_load_addr (address, orig)); - pic_ref = gen_rtx_PLUS (Pmode, pic_offset_table_rtx, address); - - emit_move_insn (address, pic_ref); - return address; - } + { + rtx pic_ref, address = gen_reg_rtx (Pmode); + + emit_insn (gen_pic_load_addr (address, orig)); + pic_ref = gen_rtx_PLUS (Pmode, pic_offset_table_rtx, address); + + emit_move_insn (address, pic_ref); + return address; + } } return orig; @@ -1927,8 +1993,8 @@ arm_finalize_pic () global_offset_table = gen_rtx_SYMBOL_REF (Pmode, "_GLOBAL_OFFSET_TABLE_"); /* On the ARM the PC register contains 'dot + 8' at the time of the - addition. */ - pic_tmp = plus_constant (gen_rtx_LABEL_REF (Pmode, l1), 8); + addition, on the Thumb it is 'dot + 4'. */ + pic_tmp = plus_constant (gen_rtx_LABEL_REF (Pmode, l1), TARGET_ARM ? 8 : 4); if (GOT_PCREL) pic_tmp2 = gen_rtx_CONST (VOIDmode, gen_rtx_PLUS (Pmode, global_offset_table, pc_rtx)); @@ -1938,7 +2004,10 @@ arm_finalize_pic () pic_rtx = gen_rtx_CONST (Pmode, gen_rtx_MINUS (Pmode, pic_tmp2, pic_tmp)); emit_insn (gen_pic_load_addr (pic_offset_table_rtx, pic_rtx)); - emit_insn (gen_pic_add_dot_plus_eight (pic_offset_table_rtx, l1)); + if (TARGET_ARM) + emit_insn (gen_pic_add_dot_plus_eight (pic_offset_table_rtx, l1)); + else + emit_insn (gen_pic_add_dot_plus_four (pic_offset_table_rtx, l1)); seq = gen_sequence (); end_sequence (); @@ -1957,19 +2026,144 @@ arm_finalize_pic () #define REG_OR_SUBREG_RTX(X) \ (GET_CODE (X) == REG ? (X) : SUBREG_REG (X)) -#define ARM_FRAME_RTX(X) \ - ((X) == frame_pointer_rtx || (X) == stack_pointer_rtx \ - || (X) == arg_pointer_rtx) +#ifndef COSTS_N_INSNS +#define COSTS_N_INSNS(N) ((N) * 4 - 2) +#endif int -arm_rtx_costs (x, code) +arm_rtx_costs (x, code, outer) rtx x; enum rtx_code code; + enum rtx_code outer; { enum machine_mode mode = GET_MODE (x); enum rtx_code subcode; int extra_cost; + if (TARGET_THUMB) + { + switch (code) + { + case ASHIFT: + case ASHIFTRT: + case LSHIFTRT: + case ROTATERT: + case PLUS: + case MINUS: + case COMPARE: + case NEG: + case NOT: + return COSTS_N_INSNS (1); + + case MULT: + if (GET_CODE (XEXP (x, 1)) == CONST_INT) + { + int cycles = 0; + unsigned HOST_WIDE_INT i = INTVAL (XEXP (x, 1)); + + while (i) + { + i >>= 2; + cycles ++; + } + return COSTS_N_INSNS (2) + cycles; + } + return COSTS_N_INSNS (1) + 16; + + case SET: + return (COSTS_N_INSNS (1) + + 4 * ((GET_CODE (SET_SRC (x)) == MEM) + + GET_CODE (SET_DEST (x)) == MEM)); + + case CONST_INT: + if (outer == SET) + { + if ((unsigned HOST_WIDE_INT) INTVAL (x) < 256) + return 0; + if (thumb_shiftable_const (INTVAL (x))) + return COSTS_N_INSNS (2); + return COSTS_N_INSNS (3); + } + else if (outer == PLUS + && INTVAL (x) < 256 && INTVAL (x) > -256) + return 0; + else if (outer == COMPARE + && (unsigned HOST_WIDE_INT) INTVAL (x) < 256) + return 0; + else if (outer == ASHIFT || outer == ASHIFTRT + || outer == LSHIFTRT) + return 0; + return COSTS_N_INSNS (2); + + case CONST: + case CONST_DOUBLE: + case LABEL_REF: + case SYMBOL_REF: + return COSTS_N_INSNS (3); + + case UDIV: + case UMOD: + case DIV: + case MOD: + return 100; + + case TRUNCATE: + return 99; + + case AND: + case XOR: + case IOR: + /* XXX guess. */ + return 8; + + case ADDRESSOF: + case MEM: + /* XXX another guess. */ + /* Memory costs quite a lot for the first word, but subsequent words + load at the equivalent of a single insn each. */ + return (10 + 4 * ((GET_MODE_SIZE (mode) - 1) / UNITS_PER_WORD) + + (CONSTANT_POOL_ADDRESS_P (x) ? 4 : 0)); + + case IF_THEN_ELSE: + /* XXX a guess. */ + if (GET_CODE (XEXP (x, 1)) == PC || GET_CODE (XEXP (x, 2)) == PC) + return 14; + return 2; + + case ZERO_EXTEND: + /* XXX still guessing. */ + switch (GET_MODE (XEXP (x, 0))) + { + case QImode: + return (1 + (mode == DImode ? 4 : 0) + + (GET_CODE (XEXP (x, 0)) == MEM ? 10 : 0)); + + case HImode: + return (4 + (mode == DImode ? 4 : 0) + + (GET_CODE (XEXP (x, 0)) == MEM ? 10 : 0)); + + case SImode: + return (1 + (GET_CODE (XEXP (x, 0)) == MEM ? 10 : 0)); + + default: + return 99; + } + + default: + return 99; +#if 0 + case FFS: + case FLOAT: + case FIX: + case UNSIGNED_FIX: + /* XXX guess */ + fprintf (stderr, "unexpected code for thumb in rtx_costs: %s\n", + rtx_name[code]); + abort (); +#endif + } + } + switch (code) { case MEM: @@ -2112,7 +2306,7 @@ arm_rtx_costs (x, code) if (GET_CODE (XEXP (x, 1)) == CONST_INT) { unsigned HOST_WIDE_INT i = (INTVAL (XEXP (x, 1)) - & (unsigned HOST_WIDE_INT) 0xffffffffUL); + & (unsigned HOST_WIDE_INT) 0xffffffff); int add_cost = const_ok_for_arm (i) ? 4 : 8; int j; @@ -2188,6 +2382,32 @@ arm_rtx_costs (x, code) } abort (); + case CONST_INT: + if (const_ok_for_arm (INTVAL (x))) + return outer == SET ? 2 : -1; + else if (outer == AND + && const_ok_for_arm (~ INTVAL (x))) + return -1; + else if ((outer == COMPARE + || outer == PLUS || outer == MINUS) + && const_ok_for_arm (- INTVAL (x))) + return -1; + else + return 5; + + case CONST: + case LABEL_REF: + case SYMBOL_REF: + return 6; + + case CONST_DOUBLE: + if (const_double_rtx_ok_for_fpu (x)) + return outer == SET ? 2 : -1; + else if ((outer == COMPARE || outer == PLUS) + && neg_const_double_rtx_ok_for_fpu (x)) + return -1; + return 7; + default: return 99; } @@ -2203,10 +2423,15 @@ arm_adjust_cost (insn, link, dep, cost) rtx i_pat, d_pat; /* XXX This is not strictly true for the FPA. */ - if (REG_NOTE_KIND(link) == REG_DEP_ANTI - || REG_NOTE_KIND(link) == REG_DEP_OUTPUT) + if (REG_NOTE_KIND (link) == REG_DEP_ANTI + || REG_NOTE_KIND (link) == REG_DEP_OUTPUT) return 0; + /* Call insns don't incur a stall, even if they follow a load. */ + if (REG_NOTE_KIND (link) == 0 + && GET_CODE (insn) == CALL_INSN) + return 1; + if ((i_pat = single_set (insn)) != NULL && GET_CODE (SET_SRC (i_pat)) == MEM && (d_pat = single_set (dep)) != NULL @@ -2325,6 +2550,7 @@ s_register_operand (op, mode) /* We don't consider registers whose class is NO_REGS to be a register operand. */ + /* XXX might have to check for lo regs only for thumb ??? */ return (GET_CODE (op) == REG && (REGNO (op) >= FIRST_PSEUDO_REGISTER || REGNO_REG_CLASS (REGNO (op)) != NO_REGS)); @@ -2356,7 +2582,7 @@ reg_or_int_operand (op, mode) /* Return 1 if OP is an item in memory, given that we are in reload. */ int -reload_memory_operand (op, mode) +arm_reload_memory_operand (op, mode) rtx op; enum machine_mode mode ATTRIBUTE_UNUSED; { @@ -2369,13 +2595,21 @@ reload_memory_operand (op, mode) } /* Return 1 if OP is a valid memory address, but not valid for a signed byte - memory access (architecture V4) */ + memory access (architecture V4). + MODE is QImode if called when computing contraints, or VOIDmode when + emitting patterns. In this latter case we cannot use memory_operand() + because it will fail on badly formed MEMs, which is precisly what we are + trying to catch. */ int bad_signed_byte_operand (op, mode) rtx op; - enum machine_mode mode; + enum machine_mode mode ATTRIBUTE_UNUSED; { - if (! memory_operand (op, mode) || GET_CODE (op) != MEM) +#if 0 + if ((mode == QImode && ! memory_operand (op, mode)) || GET_CODE (op) != MEM) + return 0; +#endif + if (GET_CODE (op) != MEM) return 0; op = XEXP (op, 0); @@ -2429,6 +2663,9 @@ arm_add_operand (op, mode) rtx op; enum machine_mode mode; { + if (TARGET_THUMB) + return thumb_cmp_operand (op, mode); + return (s_register_operand (op, mode) || (GET_CODE (op) == CONST_INT && (const_ok_for_arm (INTVAL (op)) @@ -2556,7 +2793,7 @@ power_of_two_operand (op, mode) { if (GET_CODE (op) == CONST_INT) { - HOST_WIDE_INT value = INTVAL(op); + HOST_WIDE_INT value = INTVAL (op); return value != 0 && (value & (value - 1)) == 0; } return FALSE; @@ -2595,6 +2832,27 @@ di_operand (op, mode) } } +/* Like di_operand, but don't accept constants. */ +int +nonimmediate_di_operand (op, mode) + rtx op; + enum machine_mode mode; +{ + if (s_register_operand (op, mode)) + return TRUE; + + if (mode != VOIDmode && GET_MODE (op) != VOIDmode && GET_MODE (op) != DImode) + return FALSE; + + if (GET_CODE (op) == SUBREG) + op = SUBREG_REG (op); + + if (GET_CODE (op) == MEM) + return memory_address_p (DImode, XEXP (op, 0)); + + return FALSE; +} + /* Return TRUE for a valid operand of a DFmode operation when -msoft-float. Either: REG, SUBREG, CONST_DOUBLE or MEM(DImode_address). Note that this disallows MEM(REG+REG), but allows @@ -2630,16 +2888,36 @@ soft_df_operand (op, mode) } } -/* Return TRUE for valid index operands. */ +/* Like soft_df_operand, but don't accept constants. */ +int +nonimmediate_soft_df_operand (op, mode) + rtx op; + enum machine_mode mode; +{ + if (s_register_operand (op, mode)) + return TRUE; + + if (mode != VOIDmode && GET_MODE (op) != mode) + return FALSE; + + if (GET_CODE (op) == SUBREG) + op = SUBREG_REG (op); + if (GET_CODE (op) == MEM) + return memory_address_p (DFmode, XEXP (op, 0)); + return FALSE; +} + +/* Return TRUE for valid index operands. */ int index_operand (op, mode) rtx op; enum machine_mode mode; { - return (s_register_operand(op, mode) + return (s_register_operand (op, mode) || (immediate_operand (op, mode) - && INTVAL (op) < 4096 && INTVAL (op) > -4096)); + && (GET_CODE (op) != CONST_INT + || (INTVAL (op) < 4096 && INTVAL (op) > -4096)))); } /* Return TRUE for valid shifts by a constant. This also accepts any @@ -2653,7 +2931,8 @@ const_shift_operand (op, mode) { return (power_of_two_operand (op, mode) || (immediate_operand (op, mode) - && (INTVAL (op) < 32 && INTVAL (op) > 0))); + && (GET_CODE (op) != CONST_INT + || (INTVAL (op) < 32 && INTVAL (op) > 0)))); } /* Return TRUE for arithmetic operators which can be combined with a multiply @@ -2746,11 +3025,14 @@ cc_register (x, mode) if (mode == VOIDmode) { mode = GET_MODE (x); + if (GET_MODE_CLASS (mode) != MODE_CC) return FALSE; } - if (mode == GET_MODE (x) && GET_CODE (x) == REG && REGNO (x) == 24) + if ( GET_MODE (x) == mode + && GET_CODE (x) == REG + && REGNO (x) == CC_REGNUM) return TRUE; return FALSE; @@ -2767,21 +3049,19 @@ dominant_cc_register (x, mode) if (mode == VOIDmode) { mode = GET_MODE (x); + if (GET_MODE_CLASS (mode) != MODE_CC) return FALSE; } - if (mode != CC_DNEmode && mode != CC_DEQmode + if ( mode != CC_DNEmode && mode != CC_DEQmode && mode != CC_DLEmode && mode != CC_DLTmode && mode != CC_DGEmode && mode != CC_DGTmode && mode != CC_DLEUmode && mode != CC_DLTUmode && mode != CC_DGEUmode && mode != CC_DGTUmode) return FALSE; - if (mode == GET_MODE (x) && GET_CODE (x) == REG && REGNO (x) == 24) - return TRUE; - - return FALSE; + return cc_register (x, mode); } /* Return TRUE if X references a SYMBOL_REF. */ @@ -2796,6 +3076,7 @@ symbol_mentioned_p (x) return 1; fmt = GET_RTX_FORMAT (GET_CODE (x)); + for (i = GET_RTX_LENGTH (GET_CODE (x)) - 1; i >= 0; i--) { if (fmt[i] == 'E') @@ -2896,7 +3177,6 @@ adjacent_mem_locations (a, b) /* Return 1 if OP is a load multiple operation. It is known to be parallel and the first section will be tested. */ - int load_multiple_operation (op, mode) rtx op; @@ -3061,7 +3341,7 @@ load_multiple_sequence (operands, nops, regs, base, load_offset) /* Convert a subreg of a mem into the mem itself. */ if (GET_CODE (operands[nops + i]) == SUBREG) - operands[nops + i] = alter_subreg(operands[nops + i]); + operands[nops + i] = alter_subreg (operands[nops + i]); if (GET_CODE (operands[nops + i]) != MEM) abort (); @@ -3086,7 +3366,7 @@ load_multiple_sequence (operands, nops, regs, base, load_offset) { if (i == 0) { - base_reg = REGNO(reg); + base_reg = REGNO (reg); unsorted_regs[0] = (GET_CODE (operands[i]) == REG ? REGNO (operands[i]) : REGNO (SUBREG_REG (operands[i]))); @@ -3296,7 +3576,7 @@ store_multiple_sequence (operands, nops, regs, base, load_offset) /* Convert a subreg of a mem into the mem itself. */ if (GET_CODE (operands[nops + i]) == SUBREG) - operands[nops + i] = alter_subreg(operands[nops + i]); + operands[nops + i] = alter_subreg (operands[nops + i]); if (GET_CODE (operands[nops + i]) != MEM) abort (); @@ -3462,7 +3742,6 @@ multi_register_push (op, mode) return 1; } - /* Routines for use with attributes. */ @@ -3472,9 +3751,14 @@ multi_register_push (op, mode) Supported attributes: - naked: don't output any prologue or epilogue code, - the user is assumed to do the right thing. -*/ + naked: + don't output any prologue or epilogue code, the user is assumed + to do the right thing. + + interfacearm: + Always assume that this function will be entered in ARM mode, + not Thumb mode, and that the caller wishes to be returned to in + ARM mode. */ int arm_valid_machine_decl_attribute (decl, attr, args) tree decl; @@ -3486,11 +3770,16 @@ arm_valid_machine_decl_attribute (decl, attr, args) if (is_attribute_p ("naked", attr)) return TREE_CODE (decl) == FUNCTION_DECL; + +#ifdef ARM_PE + if (is_attribute_p ("interfacearm", attr)) + return TREE_CODE (decl) == FUNCTION_DECL; +#endif /* ARM_PE */ + return 0; } /* Return non-zero if FUNC is a naked function. */ - static int arm_naked_function_p (func) tree func; @@ -3626,7 +3915,7 @@ arm_gen_movstrqi (operands) fin_dst = dst = copy_to_mode_reg (SImode, st_dst); fin_src = src = copy_to_mode_reg (SImode, st_src); - in_words_to_go = (INTVAL (operands[2]) + 3) / 4; + in_words_to_go = NUM_INTS (INTVAL (operands[2])); out_words_to_go = INTVAL (operands[2]) / 4; last_bytes = INTVAL (operands[2]) & 3; @@ -3712,13 +4001,13 @@ arm_gen_movstrqi (operands) part_bytes_reg = copy_to_mode_reg (SImode, mem); } + if (last_bytes && part_bytes_reg == NULL) + abort (); + if (BYTES_BIG_ENDIAN && last_bytes) { rtx tmp = gen_reg_rtx (SImode); - if (part_bytes_reg == NULL) - abort (); - /* The bytes we want are in the top end of the word. */ emit_insn (gen_lshrsi3 (tmp, part_bytes_reg, GEN_INT (8 * (4 - last_bytes)))); @@ -3743,26 +4032,32 @@ arm_gen_movstrqi (operands) } else { - while (last_bytes) + if (last_bytes > 1) { - if (part_bytes_reg == NULL) - abort (); - - mem = gen_rtx_MEM (QImode, dst); + mem = gen_rtx_MEM (HImode, dst); RTX_UNCHANGING_P (mem) = dst_unchanging_p; MEM_IN_STRUCT_P (mem) = dst_in_struct_p; MEM_SCALAR_P (mem) = dst_scalar_p; - emit_move_insn (mem, gen_rtx_SUBREG (QImode, part_bytes_reg, 0)); - - if (--last_bytes) + emit_move_insn (mem, gen_rtx_SUBREG (HImode, part_bytes_reg, 0)); + last_bytes -= 2; + if (last_bytes) { rtx tmp = gen_reg_rtx (SImode); - emit_insn (gen_addsi3 (dst, dst, const1_rtx)); - emit_insn (gen_lshrsi3 (tmp, part_bytes_reg, GEN_INT (8))); + emit_insn (gen_addsi3 (dst, dst, GEN_INT (2))); + emit_insn (gen_lshrsi3 (tmp, part_bytes_reg, GEN_INT (16))); part_bytes_reg = tmp; } } + + if (last_bytes) + { + mem = gen_rtx_MEM (QImode, dst); + RTX_UNCHANGING_P (mem) = dst_unchanging_p; + MEM_IN_STRUCT_P (mem) = dst_in_struct_p; + MEM_SCALAR_P (mem) = dst_scalar_p; + emit_move_insn (mem, gen_rtx_SUBREG (QImode, part_bytes_reg, 0)); + } } return 1; @@ -3772,7 +4067,7 @@ arm_gen_movstrqi (operands) into the top 16 bits of the word. We can assume that the address is known to be alignable and of the form reg, or plus (reg, const). */ rtx -gen_rotated_half_load (memref) +arm_gen_rotated_half_load (memref) rtx memref; { HOST_WIDE_INT offset = 0; @@ -3987,12 +4282,12 @@ arm_select_cc_mode (op, x, y) floating point compare: I don't think that it is needed on the arm. */ rtx -gen_compare_reg (code, x, y) +arm_gen_compare_reg (code, x, y) enum rtx_code code; rtx x, y; { enum machine_mode mode = SELECT_CC_MODE (code, x, y); - rtx cc_reg = gen_rtx_REG (mode, 24); + rtx cc_reg = gen_rtx_REG (mode, CC_REGNUM); emit_insn (gen_rtx_SET (VOIDmode, cc_reg, gen_rtx_COMPARE (mode, x, y))); @@ -4065,9 +4360,9 @@ arm_reload_in_hi (operands) if (lo == 4095) lo &= 0x7ff; - hi = ((((offset - lo) & (HOST_WIDE_INT) 0xFFFFFFFFUL) - ^ (HOST_WIDE_INT) 0x80000000UL) - - (HOST_WIDE_INT) 0x80000000UL); + hi = ((((offset - lo) & (HOST_WIDE_INT) 0xffffffff) + ^ (HOST_WIDE_INT) 0x80000000) + - (HOST_WIDE_INT) 0x80000000); if (hi + lo != offset) abort (); @@ -4211,9 +4506,9 @@ arm_reload_out_hi (operands) if (lo == 4095) lo &= 0x7ff; - hi = ((((offset - lo) & (HOST_WIDE_INT) 0xFFFFFFFFUL) - ^ (HOST_WIDE_INT) 0x80000000UL) - - (HOST_WIDE_INT) 0x80000000UL); + hi = ((((offset - lo) & (HOST_WIDE_INT) 0xffffffff) + ^ (HOST_WIDE_INT) 0x80000000) + - (HOST_WIDE_INT) 0x80000000); if (hi + lo != offset) abort (); @@ -4280,6 +4575,54 @@ arm_reload_out_hi (operands) } } +/* Print a symbolic form of X to the debug file, F. */ +static void +arm_print_value (f, x) + FILE * f; + rtx x; +{ + switch (GET_CODE (x)) + { + case CONST_INT: + fprintf (f, HOST_WIDE_INT_PRINT_HEX, INTVAL (x)); + return; + + case CONST_DOUBLE: + fprintf (f, "<0x%lx,0x%lx>", (long)XWINT (x, 2), (long)XWINT (x, 3)); + return; + + case CONST_STRING: + fprintf (f, "\"%s\"", XSTR (x, 0)); + return; + + case SYMBOL_REF: + fprintf (f, "`%s'", XSTR (x, 0)); + return; + + case LABEL_REF: + fprintf (f, "L%d", INSN_UID (XEXP (x, 0))); + return; + + case CONST: + arm_print_value (f, XEXP (x, 0)); + return; + + case PLUS: + arm_print_value (f, XEXP (x, 0)); + fprintf (f, "+"); + arm_print_value (f, XEXP (x, 1)); + return; + + case PC: + fprintf (f, "pc"); + return; + + default: + fprintf (f, "????"); + return; + } +} + /* Routines for manipulation of the constant pool. */ /* Arm instructions cannot load a large constant directly into a @@ -4334,202 +4677,674 @@ arm_reload_out_hi (operands) Possible enhancements to the algorithm (not implemented) are: - 1) ARM instructions (but not Thumb) can use negative offsets, so we - could reference back to a previous pool rather than forwards to a - new one. For large functions this may reduce the number of pools - required. - - 2) For some processors and object formats, there may be benefit in + 1) For some processors and object formats, there may be benefit in aligning the pools to the start of cache lines; this alignment would need to be taken into account when calculating addressability of a pool. */ -typedef struct +/* These typedefs are located at the start of this file, so that + they can be used in the prototypes there. This comment is to + remind readers of that fact so that the following structures + can be understood more easily. + + typedef struct minipool_node Mnode; + typedef struct minipool_fixup Mfix; */ + +struct minipool_node +{ + /* Doubly linked chain of entries. */ + Mnode * next; + Mnode * prev; + /* The maximum offset into the code that this entry can be placed. While + pushing fixes for forward references, all entries are sorted in order + of increasing max_address. */ + HOST_WIDE_INT max_address; + /* Similarly for a entry inserted for a backwards ref. */ + HOST_WIDE_INT min_address; + /* The number of fixes referencing this entry. This can become zero + if we "unpush" an entry. In this case we ignore the entry when we + come to emit the code. */ + int refcount; + /* The offset from the start of the minipool. */ + HOST_WIDE_INT offset; + /* The value in table. */ + rtx value; + /* The mode of value. */ + enum machine_mode mode; + int fix_size; +}; + +struct minipool_fixup { - rtx value; /* Value in table */ - HOST_WIDE_INT next_offset; - enum machine_mode mode; /* Mode of value */ -} minipool_node; + Mfix * next; + rtx insn; + HOST_WIDE_INT address; + rtx * loc; + enum machine_mode mode; + int fix_size; + rtx value; + Mnode * minipool; + HOST_WIDE_INT forwards; + HOST_WIDE_INT backwards; +}; -/* The maximum number of constants that can fit into one pool, since - the pc relative range is 0...4092 bytes and constants are at least 4 - bytes long. */ -#define MAX_MINIPOOL_SIZE (4092/4) -static minipool_node minipool_vector[MAX_MINIPOOL_SIZE]; -static int minipool_size; -static rtx minipool_vector_label; +/* Fixes less than a word need padding out to a word boundary. */ +#define MINIPOOL_FIX_SIZE(mode) \ + (GET_MODE_SIZE ((mode)) >= 4 ? GET_MODE_SIZE ((mode)) : 4) -/* Add a constant to the pool and return its offset within the current - pool. +static Mnode * minipool_vector_head; +static Mnode * minipool_vector_tail; +static rtx minipool_vector_label; + +/* The linked list of all minipool fixes required for this function. */ +Mfix * minipool_fix_head; +Mfix * minipool_fix_tail; +/* The fix entry for the current minipool, once it has been placed. */ +Mfix * minipool_barrier; + +/* Determines if INSN is the start of a jump table. Returns the end + of the TABLE or NULL_RTX. */ +static rtx +is_jump_table (insn) + rtx insn; +{ + rtx table; + + if (GET_CODE (insn) == JUMP_INSN + && JUMP_LABEL (insn) != NULL + && ((table = next_real_insn (JUMP_LABEL (insn))) + == next_real_insn (insn)) + && table != NULL + && GET_CODE (table) == JUMP_INSN + && (GET_CODE (PATTERN (table)) == ADDR_VEC + || GET_CODE (PATTERN (table)) == ADDR_DIFF_VEC)) + return table; + + return NULL_RTX; +} - X is the rtx we want to replace. MODE is its mode. On return, - ADDRESS_ONLY will be non-zero if we really want the address of such - a constant, not the constant itself. */ static HOST_WIDE_INT -add_minipool_constant (x, mode) - rtx x; - enum machine_mode mode; +get_jump_table_size (insn) + rtx insn; { - int i; - HOST_WIDE_INT offset; + rtx body = PATTERN (insn); + int elt = GET_CODE (body) == ADDR_DIFF_VEC ? 1 : 0; + + return GET_MODE_SIZE (GET_MODE (body)) * XVECLEN (body, elt); +} + +/* Move a minipool fix MP from its current location to before MAX_MP. + If MAX_MP is NULL, then MP doesn't need moving, but the addressing + contrains may need updating. */ +static Mnode * +move_minipool_fix_forward_ref (mp, max_mp, max_address) + Mnode * mp; + Mnode * max_mp; + HOST_WIDE_INT max_address; +{ + /* This should never be true and the code below assumes these are + different. */ + if (mp == max_mp) + abort (); + + if (max_mp == NULL) + { + if (max_address < mp->max_address) + mp->max_address = max_address; + } + else + { + if (max_address > max_mp->max_address - mp->fix_size) + mp->max_address = max_mp->max_address - mp->fix_size; + else + mp->max_address = max_address; + + /* Unlink MP from its current position. Since max_mp is non-null, + mp->prev must be non-null. */ + mp->prev->next = mp->next; + if (mp->next != NULL) + mp->next->prev = mp->prev; + else + minipool_vector_tail = mp->prev; + + /* Re-insert it before MAX_MP. */ + mp->next = max_mp; + mp->prev = max_mp->prev; + max_mp->prev = mp; + + if (mp->prev != NULL) + mp->prev->next = mp; + else + minipool_vector_head = mp; + } + + /* Save the new entry. */ + max_mp = mp; + + /* Scan over the preceeding entries and adjust their addresses as + required. */ + while (mp->prev != NULL + && mp->prev->max_address > mp->max_address - mp->prev->fix_size) + { + mp->prev->max_address = mp->max_address - mp->prev->fix_size; + mp = mp->prev; + } + + return max_mp; +} + +/* Add a constant to the minipool for a forward reference. Returns the + node added or NULL if the constant will not fit in this pool. */ +static Mnode * +add_minipool_forward_ref (fix) + Mfix * fix; +{ + /* If set, max_mp is the first pool_entry that has a lower + constraint than the one we are trying to add. */ + Mnode * max_mp = NULL; + HOST_WIDE_INT max_address = fix->address + fix->forwards; + Mnode * mp; - /* First, see if we've already got it. */ - for (i = 0; i < minipool_size; i++) + /* If this fix's address is greater than the address of the first + entry, then we can't put the fix in this pool. We subtract the + size of the current fix to ensure that if the table is fully + packed we still have enough room to insert this value by suffling + the other fixes forwards. */ + if (minipool_vector_head && + fix->address >= minipool_vector_head->max_address - fix->fix_size) + return NULL; + + /* Scan the pool to see if a constant with the same value has + already been added. While we are doing this, also note the + location where we must insert the constant if it doesn't already + exist. */ + for (mp = minipool_vector_head; mp != NULL; mp = mp->next) + { + if (GET_CODE (fix->value) == GET_CODE (mp->value) + && fix->mode == mp->mode + && (GET_CODE (fix->value) != CODE_LABEL + || (CODE_LABEL_NUMBER (fix->value) + == CODE_LABEL_NUMBER (mp->value))) + && rtx_equal_p (fix->value, mp->value)) + { + /* More than one fix references this entry. */ + mp->refcount++; + return move_minipool_fix_forward_ref (mp, max_mp, max_address); + } + + /* Note the insertion point if necessary. */ + if (max_mp == NULL + && mp->max_address > max_address) + max_mp = mp; + } + + /* The value is not currently in the minipool, so we need to create + a new entry for it. If MAX_MP is NULL, the entry will be put on + the end of the list since the placement is less constrained than + any existing entry. Otherwise, we insert the new fix before + MAX_MP and, if neceesary, adjust the constraints on the other + entries. */ + mp = xmalloc (sizeof (* mp)); + mp->fix_size = fix->fix_size; + mp->mode = fix->mode; + mp->value = fix->value; + mp->refcount = 1; + /* Not yet required for a backwards ref. */ + mp->min_address = -65536; + + if (max_mp == NULL) + { + mp->max_address = max_address; + mp->next = NULL; + mp->prev = minipool_vector_tail; + + if (mp->prev == NULL) + { + minipool_vector_head = mp; + minipool_vector_label = gen_label_rtx (); + } + else + mp->prev->next = mp; + + minipool_vector_tail = mp; + } + else { - if (GET_CODE (x) == minipool_vector[i].value->code - && mode == minipool_vector[i].mode) + if (max_address > max_mp->max_address - mp->fix_size) + mp->max_address = max_mp->max_address - mp->fix_size; + else + mp->max_address = max_address; + + mp->next = max_mp; + mp->prev = max_mp->prev; + max_mp->prev = mp; + if (mp->prev != NULL) + mp->prev->next = mp; + else + minipool_vector_head = mp; + } + + /* Save the new entry. */ + max_mp = mp; + + /* Scan over the preceeding entries and adjust their addresses as + required. */ + while (mp->prev != NULL + && mp->prev->max_address > mp->max_address - mp->prev->fix_size) + { + mp->prev->max_address = mp->max_address - mp->prev->fix_size; + mp = mp->prev; + } + + return max_mp; +} + +static Mnode * +move_minipool_fix_backward_ref (mp, min_mp, min_address) + Mnode * mp; + Mnode * min_mp; + HOST_WIDE_INT min_address; +{ + HOST_WIDE_INT offset; + + /* This should never be true, and the code below assumes these are + different. */ + if (mp == min_mp) + abort (); + + if (min_mp == NULL) + { + if (min_address > mp->min_address) + mp->min_address = min_address; + } + else + { + /* We will adjust this below if it is too loose. */ + mp->min_address = min_address; + + /* Unlink MP from its current position. Since min_mp is non-null, + mp->next must be non-null. */ + mp->next->prev = mp->prev; + if (mp->prev != NULL) + mp->prev->next = mp->next; + else + minipool_vector_head = mp->next; + + /* Reinsert it after MIN_MP. */ + mp->prev = min_mp; + mp->next = min_mp->next; + min_mp->next = mp; + if (mp->next != NULL) + mp->next->prev = mp; + else + minipool_vector_tail = mp; + } + + min_mp = mp; + + offset = 0; + for (mp = minipool_vector_head; mp != NULL; mp = mp->next) + { + mp->offset = offset; + if (mp->refcount > 0) + offset += mp->fix_size; + + if (mp->next && mp->next->min_address < mp->min_address + mp->fix_size) + mp->next->min_address = mp->min_address + mp->fix_size; + } + + return min_mp; +} + +/* Add a constant to the minipool for a backward reference. Returns the + node added or NULL if the constant will not fit in this pool. + + Note that the code for insertion for a backwards reference can be + somewhat confusing because the calculated offsets for each fix do + not take into account the size of the pool (which is still under + construction. */ +static Mnode * +add_minipool_backward_ref (fix) + Mfix * fix; +{ + /* If set, min_mp is the last pool_entry that has a lower constraint + than the one we are trying to add. */ + Mnode * min_mp = NULL; + /* This can be negative, since it is only a constraint. */ + HOST_WIDE_INT min_address = fix->address - fix->backwards; + Mnode * mp; + + /* If we can't reach the current pool from this insn, or if we can't + insert this entry at the end of the pool without pushing other + fixes out of range, then we don't try. This ensures that we + can't fail later on. */ + if (min_address >= minipool_barrier->address + || (minipool_vector_tail->min_address + fix->fix_size + >= minipool_barrier->address)) + return NULL; + + /* Scan the pool to see if a constant with the same value has + already been added. While we are doing this, also note the + location where we must insert the constant if it doesn't already + exist. */ + for (mp = minipool_vector_tail; mp != NULL; mp = mp->prev) + { + if (GET_CODE (fix->value) == GET_CODE (mp->value) + && fix->mode == mp->mode + && (GET_CODE (fix->value) != CODE_LABEL + || (CODE_LABEL_NUMBER (fix->value) + == CODE_LABEL_NUMBER (mp->value))) + && rtx_equal_p (fix->value, mp->value) + /* Check that there is enough slack to move this entry to the + end of the table (this is conservative). */ + && (mp->max_address + > (minipool_barrier->address + + minipool_vector_tail->offset + + minipool_vector_tail->fix_size))) { - if (GET_CODE (x) == CODE_LABEL) + mp->refcount++; + return move_minipool_fix_backward_ref (mp, min_mp, min_address); + } + + if (min_mp != NULL) + mp->min_address += fix->fix_size; + else + { + /* Note the insertion point if necessary. */ + if (mp->min_address < min_address) + min_mp = mp; + else if (mp->max_address + < minipool_barrier->address + mp->offset + fix->fix_size) { - if (XINT (x, 3) != XINT (minipool_vector[i].value, 3)) - continue; + /* Inserting before this entry would push the fix beyond + its maximum address (which can happen if we have + re-located a forwards fix); force the new fix to come + after it. */ + min_mp = mp; + min_address = mp->min_address + fix->fix_size; } - if (rtx_equal_p (x, minipool_vector[i].value)) - return minipool_vector[i].next_offset - GET_MODE_SIZE (mode); } } - /* Need a new one. */ - minipool_vector[minipool_size].next_offset = GET_MODE_SIZE (mode); - offset = 0; - if (minipool_size == 0) - minipool_vector_label = gen_label_rtx (); + /* We need to create a new entry. */ + mp = xmalloc (sizeof (* mp)); + mp->fix_size = fix->fix_size; + mp->mode = fix->mode; + mp->value = fix->value; + mp->refcount = 1; + mp->max_address = minipool_barrier->address + 65536; + + mp->min_address = min_address; + + if (min_mp == NULL) + { + mp->prev = NULL; + mp->next = minipool_vector_head; + + if (mp->next == NULL) + { + minipool_vector_tail = mp; + minipool_vector_label = gen_label_rtx (); + } + else + mp->next->prev = mp; + + minipool_vector_head = mp; + } + else + { + mp->next = min_mp->next; + mp->prev = min_mp; + min_mp->next = mp; + + if (mp->next != NULL) + mp->next->prev = mp; + else + minipool_vector_tail = mp; + } + + /* Save the new entry. */ + min_mp = mp; + + if (mp->prev) + mp = mp->prev; else - minipool_vector[minipool_size].next_offset - += (offset = minipool_vector[minipool_size - 1].next_offset); + mp->offset = 0; + + /* Scan over the following entries and adjust their offsets. */ + while (mp->next != NULL) + { + if (mp->next->min_address < mp->min_address + mp->fix_size) + mp->next->min_address = mp->min_address + mp->fix_size; + + if (mp->refcount) + mp->next->offset = mp->offset + mp->fix_size; + else + mp->next->offset = mp->offset; + + mp = mp->next; + } + + return min_mp; +} + +static void +assign_minipool_offsets (barrier) + Mfix * barrier; +{ + HOST_WIDE_INT offset = 0; + Mnode * mp; + + minipool_barrier = barrier; - minipool_vector[minipool_size].value = x; - minipool_vector[minipool_size].mode = mode; - minipool_size++; - return offset; + for (mp = minipool_vector_head; mp != NULL; mp = mp->next) + { + mp->offset = offset; + + if (mp->refcount > 0) + offset += mp->fix_size; + } } -/* Output the literal table. */ +/* Output the literal table */ static void dump_minipool (scan) rtx scan; { - int i; + Mnode * mp; + Mnode * nmp; + + if (rtl_dump_file) + fprintf (rtl_dump_file, + ";; Emitting minipool after insn %u; address %ld\n", + INSN_UID (scan), (unsigned long) minipool_barrier->address); scan = emit_label_after (gen_label_rtx (), scan); scan = emit_insn_after (gen_align_4 (), scan); scan = emit_label_after (minipool_vector_label, scan); - for (i = 0; i < minipool_size; i++) + for (mp = minipool_vector_head; mp != NULL; mp = nmp) { - minipool_node *p = minipool_vector + i; - - switch (GET_MODE_SIZE (p->mode)) + if (mp->refcount > 0) { - case 4: - scan = emit_insn_after (gen_consttable_4 (p->value), scan); - break; + if (rtl_dump_file) + { + fprintf (rtl_dump_file, + ";; Offset %u, min %ld, max %ld ", + (unsigned) mp->offset, (unsigned long) mp->min_address, + (unsigned long) mp->max_address); + arm_print_value (rtl_dump_file, mp->value); + fputc ('\n', rtl_dump_file); + } - case 8: - scan = emit_insn_after (gen_consttable_8 (p->value), scan); - break; + switch (mp->fix_size) + { +#ifdef HAVE_consttable_1 + case 1: + scan = emit_insn_after (gen_consttable_1 (mp->value), scan); + break; - default: - abort (); - break; +#endif +#ifdef HAVE_consttable_2 + case 2: + scan = emit_insn_after (gen_consttable_2 (mp->value), scan); + break; + +#endif +#ifdef HAVE_consttable_4 + case 4: + scan = emit_insn_after (gen_consttable_4 (mp->value), scan); + break; + +#endif +#ifdef HAVE_consttable_8 + case 8: + scan = emit_insn_after (gen_consttable_8 (mp->value), scan); + break; + +#endif + default: + abort (); + break; + } } + + nmp = mp->next; + free (mp); } + minipool_vector_head = minipool_vector_tail = NULL; scan = emit_insn_after (gen_consttable_end (), scan); scan = emit_barrier_after (scan); - minipool_size = 0; } -/* Find the last barrier less than MAX_COUNT bytes from FROM, or - create one. */ -static rtx -find_barrier (from, max_count) - rtx from; - int max_count; +/* Return the cost of forcibly inserting a barrier after INSN. */ +static int +arm_barrier_cost (insn) + rtx insn; { - int count = 0; - rtx found_barrier = 0; - rtx last = from; + /* Basing the location of the pool on the loop depth is preferable, + but at the moment, the basic block information seems to be + corrupt by this stage of the compilation. */ + int base_cost = 50; + rtx next = next_nonnote_insn (insn); + + if (next != NULL && GET_CODE (next) == CODE_LABEL) + base_cost -= 20; + + switch (GET_CODE (insn)) + { + case CODE_LABEL: + /* It will always be better to place the table before the label, rather + than after it. */ + return 50; + + case INSN: + case CALL_INSN: + return base_cost; + + case JUMP_INSN: + return base_cost - 10; + + default: + return base_cost + 10; + } +} + +/* Find the best place in the insn stream in the range + (FIX->address,MAX_ADDRESS) to forcibly insert a minipool barrier. + Create the barrier by inserting a jump and add a new fix entry for + it. */ +static Mfix * +create_fix_barrier (fix, max_address) + Mfix * fix; + HOST_WIDE_INT max_address; +{ + HOST_WIDE_INT count = 0; + rtx barrier; + rtx from = fix->insn; + rtx selected = from; + int selected_cost; + HOST_WIDE_INT selected_address; + Mfix * new_fix; + HOST_WIDE_INT max_count = max_address - fix->address; + rtx label = gen_label_rtx (); + + selected_cost = arm_barrier_cost (from); + selected_address = fix->address; while (from && count < max_count) { rtx tmp; - + int new_cost; + + /* This code shouldn't have been called if there was a natural barrier + within range. */ if (GET_CODE (from) == BARRIER) - found_barrier = from; + abort (); /* Count the length of this insn. */ - if (GET_CODE (from) == JUMP_INSN - && JUMP_LABEL (from) != 0 - && ((tmp = next_real_insn (JUMP_LABEL (from))) - == next_real_insn (from)) - && tmp != NULL - && GET_CODE (tmp) == JUMP_INSN - && (GET_CODE (PATTERN (tmp)) == ADDR_VEC - || GET_CODE (PATTERN (tmp)) == ADDR_DIFF_VEC)) - { - int elt = GET_CODE (PATTERN (tmp)) == ADDR_DIFF_VEC ? 1 : 0; - count += (get_attr_length (from) - + GET_MODE_SIZE (SImode) * XVECLEN (PATTERN (tmp), elt)); + count += get_attr_length (from); + + /* If there is a jump table, add its length. */ + tmp = is_jump_table (from); + if (tmp != NULL) + { + count += get_jump_table_size (tmp); + + /* Jump tables aren't in a basic block, so base the cost on + the dispatch insn. If we select this location, we will + still put the pool after the table. */ + new_cost = arm_barrier_cost (from); + + if (count < max_count && new_cost <= selected_cost) + { + selected = tmp; + selected_cost = new_cost; + selected_address = fix->address + count; + } + /* Continue after the dispatch table. */ - last = from; from = NEXT_INSN (tmp); continue; } - else - count += get_attr_length (from); - last = from; + new_cost = arm_barrier_cost (from); + + if (count < max_count && new_cost <= selected_cost) + { + selected = from; + selected_cost = new_cost; + selected_address = fix->address + count; + } + from = NEXT_INSN (from); } - if (! found_barrier) - { - /* We didn't find a barrier in time to - dump our stuff, so we'll make one. */ - rtx label = gen_label_rtx (); - - if (from) - from = PREV_INSN (last); - else - from = get_last_insn (); - - /* Walk back to be just before any jump. */ - while (GET_CODE (from) == JUMP_INSN - || GET_CODE (from) == NOTE - || GET_CODE (from) == CODE_LABEL) - from = PREV_INSN (from); - - from = emit_jump_insn_after (gen_jump (label), from); - JUMP_LABEL (from) = label; - found_barrier = emit_barrier_after (from); - emit_label_after (label, found_barrier); - } + /* Create a new JUMP_INSN that branches around a barrier. */ + from = emit_jump_insn_after (gen_jump (label), selected); + JUMP_LABEL (from) = label; + barrier = emit_barrier_after (from); + emit_label_after (label, barrier); - return found_barrier; -} + /* Create a minipool barrier entry for the new barrier. */ + new_fix = (Mfix *) oballoc (sizeof (* new_fix)); + new_fix->insn = barrier; + new_fix->address = selected_address; + new_fix->next = fix->next; + fix->next = new_fix; -struct minipool_fixup -{ - struct minipool_fixup *next; - rtx insn; - int address; - rtx *loc; - enum machine_mode mode; - rtx value; - int range; -}; - -struct minipool_fixup *minipool_fix_head; -struct minipool_fixup *minipool_fix_tail; + return new_fix; +} +/* Record that there is a natural barrier in the insn stream at + ADDRESS. */ static void push_minipool_barrier (insn, address) rtx insn; - int address; + HOST_WIDE_INT address; { - struct minipool_fixup *fix - = (struct minipool_fixup *) oballoc (sizeof (struct minipool_fixup)); + Mfix * fix = (Mfix *) oballoc (sizeof (* fix)); fix->insn = insn; fix->address = address; @@ -4543,21 +5358,26 @@ push_minipool_barrier (insn, address) minipool_fix_tail = fix; } +/* Record INSN, which will need fixing up to load a value from the + minipool. ADDRESS is the offset of the insn since the start of the + function; LOC is a pointer to the part of the insn which requires + fixing; VALUE is the constant that must be loaded, which is of type + MODE. */ static void push_minipool_fix (insn, address, loc, mode, value) rtx insn; - int address; - rtx *loc; + HOST_WIDE_INT address; + rtx * loc; enum machine_mode mode; rtx value; { - struct minipool_fixup *fix - = (struct minipool_fixup *) oballoc (sizeof (struct minipool_fixup)); + Mfix * fix = (Mfix *) oballoc (sizeof (* fix)); #ifdef AOF_ASSEMBLER /* PIC symbol refereneces need to be converted into offsets into the based area. */ - if (flag_pic && GET_MODE == SYMBOL_REF) + /* XXX This shouldn't be done here. */ + if (flag_pic && GET_CODE (value) == SYMBOL_REF) value = aof_pic_entry (value); #endif /* AOF_ASSEMBLER */ @@ -4565,17 +5385,32 @@ push_minipool_fix (insn, address, loc, mode, value) fix->address = address; fix->loc = loc; fix->mode = mode; + fix->fix_size = MINIPOOL_FIX_SIZE (mode); fix->value = value; - fix->range = get_attr_pool_range (insn); + fix->forwards = get_attr_pool_range (insn); + fix->backwards = get_attr_neg_pool_range (insn); + fix->minipool = NULL; /* If an insn doesn't have a range defined for it, then it isn't expecting to be reworked by this code. Better to abort now than to generate duff assembly code. */ - if (fix->range == 0) + if (fix->forwards == 0 && fix->backwards == 0) abort (); + if (rtl_dump_file) + { + fprintf (rtl_dump_file, + ";; %smode fixup for i%d; addr %lu, range (%ld,%ld): ", + GET_MODE_NAME (mode), + INSN_UID (insn), (unsigned long) address, + -1 * (long)fix->backwards, (long)fix->forwards); + arm_print_value (rtl_dump_file, fix->value); + fprintf (rtl_dump_file, "\n"); + } + /* Add it to the chain of fixes. */ fix->next = NULL; + if (minipool_fix_head != NULL) minipool_fix_tail->next = fix; else @@ -4584,21 +5419,21 @@ push_minipool_fix (insn, address, loc, mode, value) minipool_fix_tail = fix; } +/* Scan INSN and note any of its operands that need fixing. */ static void note_invalid_constants (insn, address) rtx insn; - int address; + HOST_WIDE_INT address; { int opno; - /* Extract the operands of the insn. */ - extract_insn(insn); + extract_insn (insn); - /* Find the alternative selected. */ if (! constrain_operands (1)) fatal_insn_not_found (insn); - /* Preprocess the constraints, to extract some useful information. */ + /* Fill in recog_op_alt with information about the constraints of this + insn. */ preprocess_constraints (); for (opno = 0; opno < recog_data.n_operands; opno++) @@ -4618,14 +5453,18 @@ note_invalid_constants (insn, address) if (CONSTANT_P (op)) push_minipool_fix (insn, address, recog_data.operand_loc[opno], recog_data.operand_mode[opno], op); +#if 0 + /* RWE: Now we look correctly at the operands for the insn, + this shouldn't be needed any more. */ #ifndef AOF_ASSEMBLER + /* XXX Is this still needed? */ else if (GET_CODE (op) == UNSPEC && XINT (op, 1) == 3) push_minipool_fix (insn, address, recog_data.operand_loc[opno], recog_data.operand_mode[opno], XVECEXP (op, 0, 0)); #endif - else if (recog_data.operand_mode[opno] == SImode - && GET_CODE (op) == MEM +#endif + else if (GET_CODE (op) == MEM && GET_CODE (XEXP (op, 0)) == SYMBOL_REF && CONSTANT_POOL_ADDRESS_P (XEXP (op, 0))) push_minipool_fix (insn, address, recog_data.operand_loc[opno], @@ -4640,8 +5479,8 @@ arm_reorg (first) rtx first; { rtx insn; - int address = 0; - struct minipool_fixup *fix; + HOST_WIDE_INT address = 0; + Mfix * fix; minipool_fix_head = minipool_fix_tail = NULL; @@ -4655,7 +5494,7 @@ arm_reorg (first) { if (GET_CODE (insn) == BARRIER) - push_minipool_barrier(insn, address); + push_minipool_barrier (insn, address); else if (GET_CODE (insn) == INSN || GET_CODE (insn) == CALL_INSN || GET_CODE (insn) == JUMP_INSN) { @@ -4663,104 +5502,121 @@ arm_reorg (first) note_invalid_constants (insn, address); address += get_attr_length (insn); + /* If the insn is a vector jump, add the size of the table and skip the table. */ - if (GET_CODE (insn) == JUMP_INSN - && JUMP_LABEL (insn) != NULL - && ((table = next_real_insn (JUMP_LABEL (insn))) - == next_real_insn (insn)) - && table != NULL - && GET_CODE (table) == JUMP_INSN - && (GET_CODE (PATTERN (table)) == ADDR_VEC - || GET_CODE (PATTERN (table)) == ADDR_DIFF_VEC)) + if ((table = is_jump_table (insn)) != NULL) { - int elt = GET_CODE (PATTERN (table)) == ADDR_DIFF_VEC ? 1 : 0; - - address += GET_MODE_SIZE (SImode) * XVECLEN (PATTERN (table), - elt); + address += get_jump_table_size (table); insn = table; } } } + fix = minipool_fix_head; + /* Now scan the fixups and perform the required changes. */ - for (fix = minipool_fix_head; fix; fix = fix->next) + while (fix) { - struct minipool_fixup *ftmp; - struct minipool_fixup *last_barrier = NULL; - int max_range; - rtx barrier; - struct minipool_fixup *this_fix; - int new_minipool_size = 0; + Mfix * ftmp; + Mfix * fdel; + Mfix * last_added_fix; + Mfix * last_barrier = NULL; + Mfix * this_fix; /* Skip any further barriers before the next fix. */ while (fix && GET_CODE (fix->insn) == BARRIER) fix = fix->next; + /* No more fixes. */ if (fix == NULL) break; - ftmp = fix; - max_range = fix->address + fix->range; + last_added_fix = NULL; - /* Find all the other fixes that can live in the same pool. */ - while (ftmp->next && ftmp->next->address < max_range - && (GET_CODE (ftmp->next->insn) == BARRIER - /* Ensure we can reach the constant inside the pool. */ - || ftmp->next->range > new_minipool_size)) + for (ftmp = fix; ftmp; ftmp = ftmp->next) { - ftmp = ftmp->next; if (GET_CODE (ftmp->insn) == BARRIER) - last_barrier = ftmp; - else { - /* Does this fix constrain the range we can search? */ - if (ftmp->address + ftmp->range - new_minipool_size < max_range) - max_range = ftmp->address + ftmp->range - new_minipool_size; + if (ftmp->address >= minipool_vector_head->max_address) + break; - new_minipool_size += GET_MODE_SIZE (ftmp->mode); + last_barrier = ftmp; } + else if ((ftmp->minipool = add_minipool_forward_ref (ftmp)) == NULL) + break; + + last_added_fix = ftmp; /* Keep track of the last fix added. */ } - /* If we found a barrier, drop back to that; any fixes that we could - have reached but come after the barrier will now go in the next - mini-pool. */ + /* If we found a barrier, drop back to that; any fixes that we + could have reached but come after the barrier will now go in + the next mini-pool. */ if (last_barrier != NULL) { - barrier = last_barrier->insn; + /* Reduce the refcount for those fixes that won't go into this + pool after all. */ + for (fdel = last_barrier->next; + fdel && fdel != ftmp; + fdel = fdel->next) + { + fdel->minipool->refcount--; + fdel->minipool = NULL; + } + ftmp = last_barrier; } - /* ftmp is last fix that we can fit into this pool and we - failed to find a barrier that we could use. Insert a new - barrier in the code and arrange to jump around it. */ else { + /* ftmp is first fix that we can't fit into this pool and + there no natural barriers that we could use. Insert a + new barrier in the code somewhere between the previous + fix and this one, and arrange to jump around it. */ + HOST_WIDE_INT max_address; + + /* The last item on the list of fixes must be a barrier, so + we can never run off the end of the list of fixes without + last_barrier being set. */ + if (ftmp == NULL) + abort (); + + max_address = minipool_vector_head->max_address; /* Check that there isn't another fix that is in range that we couldn't fit into this pool because the pool was already too large: we need to put the pool before such an instruction. */ - if (ftmp->next && ftmp->next->address < max_range) - max_range = ftmp->address; + if (ftmp->address < max_address) + max_address = ftmp->address; - barrier = find_barrier (ftmp->insn, max_range - ftmp->address); + last_barrier = create_fix_barrier (last_added_fix, max_address); + } + + assign_minipool_offsets (last_barrier); + + while (ftmp) + { + if (GET_CODE (ftmp->insn) != BARRIER + && ((ftmp->minipool = add_minipool_backward_ref (ftmp)) + == NULL)) + break; + + ftmp = ftmp->next; } /* Scan over the fixes we have identified for this pool, fixing them up and adding the constants to the pool itself. */ - for (this_fix = fix; this_fix && ftmp->next != this_fix; + for (this_fix = fix; this_fix && ftmp != this_fix; this_fix = this_fix->next) if (GET_CODE (this_fix->insn) != BARRIER) { - int offset = add_minipool_constant (this_fix->value, - this_fix->mode); rtx addr = plus_constant (gen_rtx_LABEL_REF (VOIDmode, minipool_vector_label), - offset); + this_fix->minipool->offset); *this_fix->loc = gen_rtx_MEM (this_fix->mode, addr); } - dump_minipool (barrier); + dump_minipool (last_barrier->insn); fix = ftmp; } @@ -4769,7 +5625,6 @@ arm_reorg (first) instruction generation. */ after_arm_reorg = 1; } - /* Routines to output assembly language. */ @@ -4816,7 +5671,7 @@ fp_const_from_val (r) INSTR is the possibly suffixed base register. HAT unequals zero if a hat must follow the register list. */ -void +static void print_multi_reg (stream, instr, reg, mask, hat) FILE * stream; char * instr; @@ -4831,7 +5686,7 @@ print_multi_reg (stream, instr, reg, mask, hat) asm_fprintf (stream, instr, reg); fputs (", {", stream); - for (i = 0; i < 16; i++) + for (i = 0; i <= LAST_ARM_REGNUM; i++) if (mask & (1 << i)) { if (not_first) @@ -5094,8 +5949,8 @@ output_move_double (operands) bcopy ((char *) &CONST_DOUBLE_LOW (operands[1]), (char *) &u, sizeof (u)); REAL_VALUE_TO_TARGET_DOUBLE (u.d, l); - otherops[1] = GEN_INT(l[1]); - operands[1] = GEN_INT(l[0]); + otherops[1] = GEN_INT (l[1]); + operands[1] = GEN_INT (l[0]); } else if (GET_MODE (operands[1]) != VOIDmode) abort (); @@ -5324,11 +6179,10 @@ output_mov_immediate (operands) n_ones++; if (n_ones > 16) /* Shorter to use MVN with BIC in this case. */ - output_multi_immediate(operands, "mvn%?\t%0, %1", "bic%?\t%0, %0, %1", 1, - ~n); + output_multi_immediate (operands, "mvn%?\t%0, %1", "bic%?\t%0, %0, %1", 1, + ~n); else - output_multi_immediate(operands, "mov%?\t%0, %1", "orr%?\t%0, %0, %1", 1, - n); + output_multi_immediate (operands, "mov%?\t%0, %1", "orr%?\t%0, %0, %1", 1, n); return ""; } @@ -5373,7 +6227,7 @@ output_multi_immediate (operands, instr1, instr2, immed_op, n) HOST_WIDE_INT n; { #if HOST_BITS_PER_WIDE_INT > 32 - n &= 0xffffffff; + n &= (unsigned HOST_WIDE_INT)0xffffffff; #endif if (n == 0) @@ -5739,6 +6593,7 @@ function_really_clobbers_lr (first) if (GET_CODE (next) == INSN && GET_CODE (PATTERN (next)) == USE && (GET_CODE (XVECEXP (PATTERN (insn), 0, 0)) == SET) + && (GET_CODE (XEXP (PATTERN (next), 0)) == REG) && (REGNO (SET_DEST (XVECEXP (PATTERN (insn), 0, 0))) == REGNO (XEXP (PATTERN (next), 0)))) if ((next = next_nonnote_insn (next)) == NULL) @@ -5768,8 +6623,12 @@ output_return_instruction (operand, really_return, reverse) int reg, live_regs = 0; int volatile_func = arm_volatile_func (); + /* If a function is naked, don't use the "return" insn. */ + if (arm_naked_function_p (current_function_decl)) + return ""; + return_used_this_function = 1; - + if (TARGET_ABORT_NORETURN && volatile_func) { /* If this function was declared non-returning, and we have found a tail @@ -5791,11 +6650,17 @@ output_return_instruction (operand, really_return, reverse) if (current_function_calls_alloca && ! really_return) abort (); - + for (reg = 0; reg <= 10; reg++) if (regs_ever_live[reg] && ! call_used_regs[reg]) live_regs++; + if (! TARGET_APCS_FRAME + && ! frame_pointer_needed + && regs_ever_live[HARD_FRAME_POINTER_REGNUM] + && ! call_used_regs[HARD_FRAME_POINTER_REGNUM]) + live_regs++; + if (flag_pic && ! TARGET_SINGLE_PIC_BASE && regs_ever_live[PIC_OFFSET_TABLE_REGNUM]) live_regs++; @@ -5814,10 +6679,14 @@ output_return_instruction (operand, really_return, reverse) /* FIXME: We ought to handle the case TARGET_APCS_32 is true, really_return is true, and only the PC needs restoring. */ && ! really_return) - { - output_asm_insn (reverse ? "ldr%?%D0\t%|lr, [%|sp], #4" - : "ldr%?%d0\t%|lr, [%|sp], #4", &operand); - } + output_asm_insn (reverse ? "ldr%?%D0\t%|lr, [%|sp], #4" + : "ldr%?%d0\t%|lr, [%|sp], #4", &operand); + else if (live_regs == 1 + && regs_ever_live[LR_REGNUM] + && ! lr_save_eliminated + && TARGET_APCS_32) + output_asm_insn (reverse ? "ldr%?%D0\t%|pc, [%|sp], #4" + : "ldr%?%d0\t%|pc, [%|sp], #4", &operand); else if (live_regs) { if (lr_save_eliminated || ! regs_ever_live[LR_REGNUM]) @@ -5856,12 +6725,23 @@ output_return_instruction (operand, really_return, reverse) } else { + if (! TARGET_APCS_FRAME + && regs_ever_live[HARD_FRAME_POINTER_REGNUM] + && ! call_used_regs[HARD_FRAME_POINTER_REGNUM]) + { + strcat (instr, "%|"); + strcat (instr, reg_names[HARD_FRAME_POINTER_REGNUM]); + strcat (instr, ", "); + } + strcat (instr, "%|"); + if (TARGET_INTERWORK && really_return) strcat (instr, reg_names[IP_REGNUM]); else strcat (instr, really_return ? reg_names[PC_REGNUM] : reg_names[LR_REGNUM]); } + strcat (instr, (TARGET_APCS_32 || !really_return) ? "}" : "}^"); output_asm_insn (instr, &operand); @@ -5938,12 +6818,12 @@ arm_poke_function_name (stream, name) unsigned long length; rtx x; - length = strlen (name) + 1; - alignlength = (length + 3) & ~3; + length = strlen (name) + 1; + alignlength = ROUND_UP (length); ASM_OUTPUT_ASCII (stream, name, length); ASM_OUTPUT_ALIGN (stream, 2); - x = GEN_INT (0xff000000UL + alignlength); + x = GEN_INT (((unsigned HOST_WIDE_INT)0xff000000) + alignlength); ASM_OUTPUT_INT (stream, x); } @@ -5956,7 +6836,7 @@ arm_poke_function_name (stream, name) lr is not clobbered in any other way, then there is no need to push lr onto the stack. */ void -output_func_prologue (f, frame_size) +output_arm_prologue (f, frame_size) FILE * f; int frame_size; { @@ -5993,6 +6873,12 @@ output_func_prologue (f, frame_size) if (regs_ever_live[reg] && ! call_used_regs[reg]) live_regs_mask |= (1 << reg); + if (! TARGET_APCS_FRAME + && ! frame_pointer_needed + && regs_ever_live[HARD_FRAME_POINTER_REGNUM] + && ! call_used_regs[HARD_FRAME_POINTER_REGNUM]) + live_regs_mask |= (1 << HARD_FRAME_POINTER_REGNUM); + if (flag_pic && ! TARGET_SINGLE_PIC_BASE && regs_ever_live[PIC_OFFSET_TABLE_REGNUM]) live_regs_mask |= (1 << PIC_OFFSET_TABLE_REGNUM); @@ -6037,8 +6923,11 @@ arm_output_epilogue () int floats_offset = 12; rtx operands[3]; int frame_size = get_frame_size (); - FILE *f = asm_out_file; - int volatile_func = arm_volatile_func (); + rtx eh_ofs = cfun->machine->eh_epilogue_sp_ofs; + FILE * f = asm_out_file; + int volatile_func = (optimize > 0 + && TREE_THIS_VOLATILE (current_function_decl)); + int return_regnum; if (use_return_insn (FALSE) && return_used_this_function) return ""; @@ -6047,6 +6936,10 @@ arm_output_epilogue () if (arm_naked_function_p (current_function_decl)) return ""; + /* If we are throwing an exception, the address we want to jump to is in + R1; otherwise, it's in LR. */ + return_regnum = eh_ofs ? 2 : LR_REGNUM; + /* A volatile function should never return. Call abort. */ if (TARGET_ABORT_NORETURN && volatile_func) { @@ -6064,6 +6957,16 @@ arm_output_epilogue () floats_offset += 4; } + /* Handle the frame pointer as a special case. */ + if (! TARGET_APCS_FRAME + && ! frame_pointer_needed + && regs_ever_live[HARD_FRAME_POINTER_REGNUM] + && ! call_used_regs[HARD_FRAME_POINTER_REGNUM]) + { + live_regs_mask |= (1 << HARD_FRAME_POINTER_REGNUM); + floats_offset += 4; + } + /* If we aren't loading the PIC register, don't stack it even though it may be live. */ if (flag_pic && ! TARGET_SINGLE_PIC_BASE @@ -6077,7 +6980,7 @@ arm_output_epilogue () { if (arm_fpu_arch == FP_SOFT2) { - for (reg = 23; reg > 15; reg--) + for (reg = LAST_ARM_FP_REGNUM; reg >= FIRST_ARM_FP_REGNUM; reg--) if (regs_ever_live[reg] && ! call_used_regs[reg]) { floats_offset += 12; @@ -6087,9 +6990,9 @@ arm_output_epilogue () } else { - int start_reg = 23; + int start_reg = LAST_ARM_FP_REGNUM; - for (reg = 23; reg > 15; reg--) + for (reg = LAST_ARM_FP_REGNUM; reg >= FIRST_ARM_FP_REGNUM; reg--) { if (regs_ever_live[reg] && ! call_used_regs[reg]) { @@ -6124,7 +7027,20 @@ arm_output_epilogue () { live_regs_mask |= 0x6800; print_multi_reg (f, "ldmea\t%r", FP_REGNUM, live_regs_mask, FALSE); - asm_fprintf (f, "\tbx\t%r\n", LR_REGNUM); + if (eh_ofs) + asm_fprintf (f, "\tadd\t%r, %r, %r\n", SP_REGNUM, SP_REGNUM, + REGNO (eh_ofs)); + asm_fprintf (f, "\tbx\t%r\n", return_regnum); + } + else if (eh_ofs) + { + live_regs_mask |= 0x6800; + print_multi_reg (f, "ldmea\t%r", FP_REGNUM, live_regs_mask, FALSE); + asm_fprintf (f, "\tadd\t%r, %r, %r\n", SP_REGNUM, SP_REGNUM, + REGNO (eh_ofs)); + /* Even in 26-bit mode we do a mov (rather than a movs) because + we don't have the PSR bits set in the address. */ + asm_fprintf (f, "\tmov\t%r, %r\n", PC_REGNUM, return_regnum); } else { @@ -6146,16 +7062,16 @@ arm_output_epilogue () if (arm_fpu_arch == FP_SOFT2) { - for (reg = 16; reg < 24; reg++) + for (reg = FIRST_ARM_FP_REGNUM; reg <= LAST_ARM_FP_REGNUM; reg++) if (regs_ever_live[reg] && ! call_used_regs[reg]) asm_fprintf (f, "\tldfe\t%r, [%r], #12\n", reg, SP_REGNUM); } else { - int start_reg = 16; + int start_reg = FIRST_ARM_FP_REGNUM; - for (reg = 16; reg < 24; reg++) + for (reg = FIRST_ARM_FP_REGNUM; reg <= LAST_ARM_FP_REGNUM; reg++) { if (regs_ever_live[reg] && ! call_used_regs[reg]) { @@ -6190,17 +7106,48 @@ arm_output_epilogue () if (! lr_save_eliminated) live_regs_mask |= 1 << LR_REGNUM; - if (live_regs_mask != 0) - print_multi_reg (f, "ldmfd\t%r!", SP_REGNUM, live_regs_mask, FALSE); - - asm_fprintf (f, "\tbx\t%r\n", LR_REGNUM); + /* Handle LR on its own. */ + if (live_regs_mask == (1 << LR_REGNUM)) + { + if (eh_ofs) + asm_fprintf (f, "\tadd\t%r, %r, #4\n", SP_REGNUM, + SP_REGNUM); + else + asm_fprintf (f, "\tldr\t%r, [%r], #4\n", LR_REGNUM, + SP_REGNUM); + } + else if (live_regs_mask != 0) + print_multi_reg (f, "ldmfd\t%r!", SP_REGNUM, live_regs_mask, + FALSE); + + if (eh_ofs) + asm_fprintf (f, "\tadd\t%r, %r, %r\n", SP_REGNUM, SP_REGNUM, + REGNO (eh_ofs)); + + asm_fprintf (f, "\tbx\t%r\n", return_regnum); } else if (lr_save_eliminated) - asm_fprintf (f, + asm_fprintf (f, TARGET_APCS_32 ? "\tmov\t%r, %r\n" : "\tmovs\t%r, %r\n", PC_REGNUM, LR_REGNUM); + else if (eh_ofs) + { + if (live_regs_mask == 0) + asm_fprintf (f, "\tadd\t%r, %r, #4\n", SP_REGNUM, SP_REGNUM); + else + print_multi_reg (f, "\tldmfd\t%r!", SP_REGNUM, + live_regs_mask | (1 << LR_REGNUM), FALSE); + + asm_fprintf (f, "\tadd\t%r, %r, %r\n", SP_REGNUM, SP_REGNUM, + REGNO (eh_ofs)); + /* Jump to the target; even in 26-bit mode. */ + asm_fprintf (f, "\tmov\t%r, %r\n", PC_REGNUM, return_regnum); + } + else if (TARGET_APCS_32 && live_regs_mask == 0) + asm_fprintf (f, "\tldr\t%r, [%r], #4\n", PC_REGNUM, SP_REGNUM); else - print_multi_reg (f, "ldmfd\t%r!", SP_REGNUM, live_regs_mask | 0x8000, + print_multi_reg (f, "ldmfd\t%r!", SP_REGNUM, + live_regs_mask | (1 << PC_REGNUM), TARGET_APCS_32 ? FALSE : TRUE); } else @@ -6211,8 +7158,18 @@ arm_output_epilogue () if (! lr_save_eliminated) live_regs_mask |= 1 << LR_REGNUM; - if (live_regs_mask != 0) - print_multi_reg (f, "ldmfd\t%r!", SP_REGNUM, live_regs_mask, FALSE); + if (live_regs_mask == (1 << LR_REGNUM)) + { + if (eh_ofs) + asm_fprintf (f, "\tadd\t%r, %r, #4\n", SP_REGNUM, + SP_REGNUM); + else + asm_fprintf (f, "\tldr\t%r, [%r], #4\n", LR_REGNUM, + SP_REGNUM); + } + else if (live_regs_mask != 0) + print_multi_reg (f, "ldmfd\t%r!", SP_REGNUM, live_regs_mask, + FALSE); } if (current_function_pretend_args_size) @@ -6222,13 +7179,18 @@ arm_output_epilogue () operands[2] = GEN_INT (current_function_pretend_args_size); output_add_immediate (operands); } + + if (eh_ofs) + asm_fprintf (f, "\tadd\t%r, %r, %r\n", SP_REGNUM, SP_REGNUM, + REGNO (eh_ofs)); + /* And finally, go home. */ if (TARGET_INTERWORK) - asm_fprintf (f, "\tbx\t%r\n", LR_REGNUM); - else if (TARGET_APCS_32) - asm_fprintf (f, "\tmov\t%r, %r\n", PC_REGNUM, LR_REGNUM); + asm_fprintf (f, "\tbx\t%r\n", return_regnum); + else if (TARGET_APCS_32 || eh_ofs) + asm_fprintf (f, "\tmov\t%r, %r\n", PC_REGNUM, return_regnum); else - asm_fprintf (f, "\tmovs\t%r, %r\n", PC_REGNUM, LR_REGNUM); + asm_fprintf (f, "\tmovs\t%r, %r\n", PC_REGNUM, return_regnum); } } @@ -6239,14 +7201,25 @@ void output_func_epilogue (frame_size) int frame_size; { - if (use_return_insn (FALSE) && return_used_this_function - && (frame_size + current_function_outgoing_args_size) != 0 - && ! (frame_pointer_needed && TARGET_APCS)) - abort (); + if (TARGET_THUMB) + { + /* ??? Probably not safe to set this here, since it assumes that a + function will be emitted as assembly immediately after we generate + RTL for it. This does not happen for inline functions. */ + return_used_this_function = 0; + } + else + { + if (use_return_insn (FALSE) + && return_used_this_function + && (frame_size + current_function_outgoing_args_size) != 0 + && ! frame_pointer_needed) + abort (); - /* Reset the ARM-specific per-function variables. */ - current_function_anonymous_args = 0; - after_arm_reorg = 0; + /* Reset the ARM-specific per-function variables. */ + current_function_anonymous_args = 0; + after_arm_reorg = 0; + } } /* Generate and emit an insn that we will recognize as a push_multi. @@ -6263,9 +7236,9 @@ emit_multi_reg_push (mask) rtx dwarf; rtx tmp, reg; - for (i = 0; i < 16; i++) + for (i = 0; i <= LAST_ARM_REGNUM; i++) if (mask & (1 << i)) - num_regs++; + num_regs ++; if (num_regs == 0 || num_regs > 16) abort (); @@ -6274,7 +7247,7 @@ emit_multi_reg_push (mask) dwarf = gen_rtx_PARALLEL (VOIDmode, rtvec_alloc (num_regs)); RTX_FRAME_RELATED_P (dwarf) = 1; - for (i = 0; i < 16; i++) + for (i = 0; i <= LAST_ARM_REGNUM; i++) { if (mask & (1 << i)) { @@ -6404,6 +7377,12 @@ arm_expand_prologue () if (regs_ever_live[reg] && ! call_used_regs[reg]) live_regs_mask |= 1 << reg; + if (! TARGET_APCS_FRAME + && ! frame_pointer_needed + && regs_ever_live[HARD_FRAME_POINTER_REGNUM] + && ! call_used_regs[HARD_FRAME_POINTER_REGNUM]) + live_regs_mask |= 1 << HARD_FRAME_POINTER_REGNUM; + if (flag_pic && regs_ever_live[PIC_OFFSET_TABLE_REGNUM]) live_regs_mask |= 1 << PIC_OFFSET_TABLE_REGNUM; @@ -6440,12 +7419,13 @@ arm_expand_prologue () RTX_FRAME_RELATED_P (insn) = 1; } - /* And now the floating point regs. */ + /* For now the integer regs are still pushed in output_arm_epilogue (). */ + if (! volatile_func) { if (arm_fpu_arch == FP_SOFT2) { - for (reg = 23; reg > 15; reg--) + for (reg = LAST_ARM_FP_REGNUM; reg >= FIRST_ARM_FP_REGNUM; reg --) if (regs_ever_live[reg] && ! call_used_regs[reg]) { insn = gen_rtx_PRE_DEC (XFmode, stack_pointer_rtx); @@ -6457,9 +7437,9 @@ arm_expand_prologue () } else { - int start_reg = 23; + int start_reg = LAST_ARM_FP_REGNUM; - for (reg = 23; reg > 15; reg--) + for (reg = LAST_ARM_FP_REGNUM; reg >= FIRST_ARM_FP_REGNUM; reg --) { if (regs_ever_live[reg] && ! call_used_regs[reg]) { @@ -6541,6 +7521,10 @@ arm_print_operand (stream, x, code) fputs (ASM_COMMENT_START, stream); return; + case '_': + fputs (user_label_prefix, stream); + return; + case '|': fputs (REGISTER_PREFIX, stream); return; @@ -6600,44 +7584,84 @@ arm_print_operand (stream, x, code) } return; + /* An explanation of the 'Q', 'R' and 'H' register operands: + + In a pair of registers containing a DI or DF value the 'Q' + operand returns the register number of the register containing + the least signficant part of the value. The 'R' operand returns + the register number of the register containing the most + significant part of the value. + + The 'H' operand returns the higher of the two register numbers. + On a run where WORDS_BIG_ENDIAN is true the 'H' operand is the + same as the 'Q' operand, since the most signficant part of the + value is held in the lower number register. The reverse is true + on systems where WORDS_BIG_ENDIAN is false. + + The purpose of these operands is to distinguish between cases + where the endian-ness of the values is important (for example + when they are added together), and cases where the endian-ness + is irrelevant, but the order of register operations is important. + For example when loading a value from memory into a register + pair, the endian-ness does not matter. Provided that the value + from the lower memory address is put into the lower numbered + register, and the value from the higher address is put into the + higher numbered register, the load will work regardless of whether + the value being loaded is big-wordian or little-wordian. The + order of the two register loads can matter however, if the address + of the memory location is actually held in one of the registers + being overwritten by the load. */ case 'Q': - if (REGNO (x) > 15) + if (REGNO (x) > LAST_ARM_REGNUM) abort (); - fputs (REGISTER_PREFIX, stream); - fputs (reg_names[REGNO (x) + (WORDS_BIG_ENDIAN ? 1 : 0)], stream); + asm_fprintf (stream, "%r", REGNO (x) + (WORDS_BIG_ENDIAN ? 1 : 0)); return; case 'R': - if (REGNO (x) > 15) + if (REGNO (x) > LAST_ARM_REGNUM) abort (); - fputs (REGISTER_PREFIX, stream); - fputs (reg_names[REGNO (x) + (WORDS_BIG_ENDIAN ? 0 : 1)], stream); + asm_fprintf (stream, "%r", REGNO (x) + (WORDS_BIG_ENDIAN ? 0 : 1)); + return; + + case 'H': + if (REGNO (x) > LAST_ARM_REGNUM) + abort (); + asm_fprintf (stream, "%r", REGNO (x) + 1); return; case 'm': - fputs (REGISTER_PREFIX, stream); - if (GET_CODE (XEXP (x, 0)) == REG) - fputs (reg_names[REGNO (XEXP (x, 0))], stream); - else - fputs (reg_names[REGNO (XEXP (XEXP (x, 0), 0))], stream); + asm_fprintf (stream, "%r", + GET_CODE (XEXP (x, 0)) == REG + ? REGNO (XEXP (x, 0)) : REGNO (XEXP (XEXP (x, 0), 0))); return; case 'M': asm_fprintf (stream, "{%r-%r}", - REGNO (x), REGNO (x) + NUM_REGS (GET_MODE (x)) - 1); + REGNO (x), + REGNO (x) + NUM_REGS (GET_MODE (x)) - 1); return; case 'd': - if (x) + if (! x) + return; + + if (TARGET_ARM) fputs (arm_condition_codes[get_arm_condition_code (x)], stream); + else + fputs (thumb_condition_code (x, 0), stream); return; case 'D': - if (x) - fputs (arm_condition_codes[ARM_INVERSE_CONDITION_CODE - (get_arm_condition_code (x))], + if (! x) + return; + + if (TARGET_ARM) + fputs (arm_condition_codes[ARM_INVERSE_CONDITION_CODE + (get_arm_condition_code (x))], stream); + else + fputs (thumb_condition_code (x, 1), stream); return; default: @@ -6645,10 +7669,7 @@ arm_print_operand (stream, x, code) abort (); if (GET_CODE (x) == REG) - { - fputs (REGISTER_PREFIX, stream); - fputs (reg_names[REGNO (x)], stream); - } + asm_fprintf (stream, "%r", REGNO (x)); else if (GET_CODE (x) == MEM) { output_memory_reference_mode = GET_MODE (x); @@ -7136,7 +8157,7 @@ arm_final_prescan_insn (insn) if (reverse || then_not_else) arm_current_cc = ARM_INVERSE_CONDITION_CODE (arm_current_cc); } - + /* Restore recog_data (getting the attributes of other insns can destroy this array, but final.c assumes that it remains intact across this call; since the insn has been recognized already we @@ -7145,6 +8166,1547 @@ arm_final_prescan_insn (insn) } } +int +arm_regno_class (regno) + int regno; +{ + if (TARGET_THUMB) + { + if (regno == STACK_POINTER_REGNUM) + return STACK_REG; + if (regno == CC_REGNUM) + return CC_REG; + if (regno < 8) + return LO_REGS; + return HI_REGS; + } + + if ( regno <= LAST_ARM_REGNUM + || regno == FRAME_POINTER_REGNUM + || regno == ARG_POINTER_REGNUM) + return GENERAL_REGS; + + if (regno == CC_REGNUM) + return NO_REGS; + + return FPU_REGS; +} + +/* Handle a special case when computing the offset + of an argument from the frame pointer. */ +int +arm_debugger_arg_offset (value, addr) + int value; + rtx addr; +{ + rtx insn; + + /* We are only interested if dbxout_parms() failed to compute the offset. */ + if (value != 0) + return 0; + + /* We can only cope with the case where the address is held in a register. */ + if (GET_CODE (addr) != REG) + return 0; + + /* If we are using the frame pointer to point at the argument, then + an offset of 0 is correct. */ + if (REGNO (addr) == HARD_FRAME_POINTER_REGNUM) + return 0; + + /* If we are using the stack pointer to point at the + argument, then an offset of 0 is correct. */ + if ((TARGET_THUMB || ! frame_pointer_needed) + && REGNO (addr) == SP_REGNUM) + return 0; + + /* Oh dear. The argument is pointed to by a register rather + than being held in a register, or being stored at a known + offset from the frame pointer. Since GDB only understands + those two kinds of argument we must translate the address + held in the register into an offset from the frame pointer. + We do this by searching through the insns for the function + looking to see where this register gets its value. If the + register is initialised from the frame pointer plus an offset + then we are in luck and we can continue, otherwise we give up. + + This code is exercised by producing debugging information + for a function with arguments like this: + + double func (double a, double b, int c, double d) {return d;} + + Without this code the stab for parameter 'd' will be set to + an offset of 0 from the frame pointer, rather than 8. */ + + /* The if() statement says: + + If the insn is a normal instruction + and if the insn is setting the value in a register + and if the register being set is the register holding the address of the argument + and if the address is computing by an addition + that involves adding to a register + which is the frame pointer + a constant integer + + then... */ + + for (insn = get_insns (); insn; insn = NEXT_INSN (insn)) + { + if ( GET_CODE (insn) == INSN + && GET_CODE (PATTERN (insn)) == SET + && REGNO (XEXP (PATTERN (insn), 0)) == REGNO (addr) + && GET_CODE (XEXP (PATTERN (insn), 1)) == PLUS + && GET_CODE (XEXP (XEXP (PATTERN (insn), 1), 0)) == REG + && REGNO (XEXP (XEXP (PATTERN (insn), 1), 0)) == HARD_FRAME_POINTER_REGNUM + && GET_CODE (XEXP (XEXP (PATTERN (insn), 1), 1)) == CONST_INT + ) + { + value = INTVAL (XEXP (XEXP (PATTERN (insn), 1), 1)); + + break; + } + } + + if (value == 0) + { + debug_rtx (addr); + warning ("Unable to compute real location of stacked parameter"); + value = 8; /* XXX magic hack */ + } + + return value; +} + + +/* Recursively search through all of the blocks in a function + checking to see if any of the variables created in that + function match the RTX called 'orig'. If they do then + replace them with the RTX called 'new'. */ + +static void +replace_symbols_in_block (block, orig, new) + tree block; + rtx orig; + rtx new; +{ + for (; block; block = BLOCK_CHAIN (block)) + { + tree sym; + + if (! TREE_USED (block)) + continue; + + for (sym = BLOCK_VARS (block); sym; sym = TREE_CHAIN (sym)) + { + if ( (DECL_NAME (sym) == 0 && TREE_CODE (sym) != TYPE_DECL) + || DECL_IGNORED_P (sym) + || TREE_CODE (sym) != VAR_DECL + || DECL_EXTERNAL (sym) + || ! rtx_equal_p (DECL_RTL (sym), orig) + ) + continue; + + DECL_RTL (sym) = new; + } + + replace_symbols_in_block (BLOCK_SUBBLOCKS (block), orig, new); + } +} + +/* Return the number (counting from 0) of the least significant set + bit in MASK. */ +#ifdef __GNUC__ +inline +#endif +static int +number_of_first_bit_set (mask) + int mask; +{ + int bit; + + for (bit = 0; + (mask & (1 << bit)) == 0; + ++ bit) + continue; + + return bit; +} + +/* Generate code to return from a thumb function. + If 'reg_containing_return_addr' is -1, then the return address is + actually on the stack, at the stack pointer. */ +static void +thumb_exit (f, reg_containing_return_addr, eh_ofs) + FILE * f; + int reg_containing_return_addr; + rtx eh_ofs; +{ + unsigned regs_available_for_popping; + unsigned regs_to_pop; + int pops_needed; + unsigned available; + unsigned required; + int mode; + int size; + int restore_a4 = FALSE; + + /* Compute the registers we need to pop. */ + regs_to_pop = 0; + pops_needed = 0; + + /* There is an assumption here, that if eh_ofs is not NULL, the + normal return address will have been pushed. */ + if (reg_containing_return_addr == -1 || eh_ofs) + { + /* When we are generating a return for __builtin_eh_return, + reg_containing_return_addr must specify the return regno. */ + if (eh_ofs && reg_containing_return_addr == -1) + abort (); + + regs_to_pop |= 1 << LR_REGNUM; + ++ pops_needed; + } + + if (TARGET_BACKTRACE) + { + /* Restore the (ARM) frame pointer and stack pointer. */ + regs_to_pop |= (1 << ARM_HARD_FRAME_POINTER_REGNUM) | (1 << SP_REGNUM); + pops_needed += 2; + } + + /* If there is nothing to pop then just emit the BX instruction and + return. */ + if (pops_needed == 0) + { + if (eh_ofs) + asm_fprintf (f, "\tadd\t%r, %r\n", SP_REGNUM, REGNO (eh_ofs)); + + asm_fprintf (f, "\tbx\t%r\n", reg_containing_return_addr); + return; + } + /* Otherwise if we are not supporting interworking and we have not created + a backtrace structure and the function was not entered in ARM mode then + just pop the return address straight into the PC. */ + else if ( ! TARGET_INTERWORK + && ! TARGET_BACKTRACE + && ! is_called_in_ARM_mode (current_function_decl)) + { + if (eh_ofs) + { + asm_fprintf (f, "\tadd\t%r, #4\n", SP_REGNUM); + asm_fprintf (f, "\tadd\t%r, %r\n", SP_REGNUM, REGNO (eh_ofs)); + asm_fprintf (f, "\tbx\t%r\n", reg_containing_return_addr); + } + else + asm_fprintf (f, "\tpop\t{%r}\n", PC_REGNUM); + + return; + } + + /* Find out how many of the (return) argument registers we can corrupt. */ + regs_available_for_popping = 0; + + /* If returning via __builtin_eh_return, the bottom three registers + all contain information needed for the return. */ + if (eh_ofs) + size = 12; + else + { +#ifdef RTX_CODE + /* If we can deduce the registers used from the function's + return value. This is more reliable that examining + regs_ever_live[] because that will be set if the register is + ever used in the function, not just if the register is used + to hold a return value. */ + + if (current_function_return_rtx != 0) + mode = GET_MODE (current_function_return_rtx); + else +#endif + mode = DECL_MODE (DECL_RESULT (current_function_decl)); + + size = GET_MODE_SIZE (mode); + + if (size == 0) + { + /* In a void function we can use any argument register. + In a function that returns a structure on the stack + we can use the second and third argument registers. */ + if (mode == VOIDmode) + regs_available_for_popping = + (1 << ARG_REGISTER (1)) + | (1 << ARG_REGISTER (2)) + | (1 << ARG_REGISTER (3)); + else + regs_available_for_popping = + (1 << ARG_REGISTER (2)) + | (1 << ARG_REGISTER (3)); + } + else if (size <= 4) + regs_available_for_popping = + (1 << ARG_REGISTER (2)) + | (1 << ARG_REGISTER (3)); + else if (size <= 8) + regs_available_for_popping = + (1 << ARG_REGISTER (3)); + } + + /* Match registers to be popped with registers into which we pop them. */ + for (available = regs_available_for_popping, + required = regs_to_pop; + required != 0 && available != 0; + available &= ~(available & - available), + required &= ~(required & - required)) + -- pops_needed; + + /* If we have any popping registers left over, remove them. */ + if (available > 0) + regs_available_for_popping &= ~ available; + + /* Otherwise if we need another popping register we can use + the fourth argument register. */ + else if (pops_needed) + { + /* If we have not found any free argument registers and + reg a4 contains the return address, we must move it. */ + if (regs_available_for_popping == 0 + && reg_containing_return_addr == LAST_ARG_REGNUM) + { + asm_fprintf (f, "\tmov\t%r, %r\n", LR_REGNUM, LAST_ARG_REGNUM); + reg_containing_return_addr = LR_REGNUM; + } + else if (size > 12) + { + /* Register a4 is being used to hold part of the return value, + but we have dire need of a free, low register. */ + restore_a4 = TRUE; + + asm_fprintf (f, "\tmov\t%r, %r\n",IP_REGNUM, LAST_ARG_REGNUM); + } + + if (reg_containing_return_addr != LAST_ARG_REGNUM) + { + /* The fourth argument register is available. */ + regs_available_for_popping |= 1 << LAST_ARG_REGNUM; + + -- pops_needed; + } + } + + /* Pop as many registers as we can. */ + thumb_pushpop (f, regs_available_for_popping, FALSE); + + /* Process the registers we popped. */ + if (reg_containing_return_addr == -1) + { + /* The return address was popped into the lowest numbered register. */ + regs_to_pop &= ~ (1 << LR_REGNUM); + + reg_containing_return_addr = + number_of_first_bit_set (regs_available_for_popping); + + /* Remove this register for the mask of available registers, so that + the return address will not be corrupted by futher pops. */ + regs_available_for_popping &= ~ (1 << reg_containing_return_addr); + } + + /* If we popped other registers then handle them here. */ + if (regs_available_for_popping) + { + int frame_pointer; + + /* Work out which register currently contains the frame pointer. */ + frame_pointer = number_of_first_bit_set (regs_available_for_popping); + + /* Move it into the correct place. */ + asm_fprintf (f, "\tmov\t%r, %r\n", + ARM_HARD_FRAME_POINTER_REGNUM, frame_pointer); + + /* (Temporarily) remove it from the mask of popped registers. */ + regs_available_for_popping &= ~ (1 << frame_pointer); + regs_to_pop &= ~ (1 << ARM_HARD_FRAME_POINTER_REGNUM); + + if (regs_available_for_popping) + { + int stack_pointer; + + /* We popped the stack pointer as well, + find the register that contains it. */ + stack_pointer = number_of_first_bit_set (regs_available_for_popping); + + /* Move it into the stack register. */ + asm_fprintf (f, "\tmov\t%r, %r\n", SP_REGNUM, stack_pointer); + + /* At this point we have popped all necessary registers, so + do not worry about restoring regs_available_for_popping + to its correct value: + + assert (pops_needed == 0) + assert (regs_available_for_popping == (1 << frame_pointer)) + assert (regs_to_pop == (1 << STACK_POINTER)) */ + } + else + { + /* Since we have just move the popped value into the frame + pointer, the popping register is available for reuse, and + we know that we still have the stack pointer left to pop. */ + regs_available_for_popping |= (1 << frame_pointer); + } + } + + /* If we still have registers left on the stack, but we no longer have + any registers into which we can pop them, then we must move the return + address into the link register and make available the register that + contained it. */ + if (regs_available_for_popping == 0 && pops_needed > 0) + { + regs_available_for_popping |= 1 << reg_containing_return_addr; + + asm_fprintf (f, "\tmov\t%r, %r\n", LR_REGNUM, + reg_containing_return_addr); + + reg_containing_return_addr = LR_REGNUM; + } + + /* If we have registers left on the stack then pop some more. + We know that at most we will want to pop FP and SP. */ + if (pops_needed > 0) + { + int popped_into; + int move_to; + + thumb_pushpop (f, regs_available_for_popping, FALSE); + + /* We have popped either FP or SP. + Move whichever one it is into the correct register. */ + popped_into = number_of_first_bit_set (regs_available_for_popping); + move_to = number_of_first_bit_set (regs_to_pop); + + asm_fprintf (f, "\tmov\t%r, %r\n", move_to, popped_into); + + regs_to_pop &= ~ (1 << move_to); + + -- pops_needed; + } + + /* If we still have not popped everything then we must have only + had one register available to us and we are now popping the SP. */ + if (pops_needed > 0) + { + int popped_into; + + thumb_pushpop (f, regs_available_for_popping, FALSE); + + popped_into = number_of_first_bit_set (regs_available_for_popping); + + asm_fprintf (f, "\tmov\t%r, %r\n", SP_REGNUM, popped_into); + /* + assert (regs_to_pop == (1 << STACK_POINTER)) + assert (pops_needed == 1) + */ + } + + /* If necessary restore the a4 register. */ + if (restore_a4) + { + if (reg_containing_return_addr != LR_REGNUM) + { + asm_fprintf (f, "\tmov\t%r, %r\n", LR_REGNUM, LAST_ARG_REGNUM); + reg_containing_return_addr = LR_REGNUM; + } + + asm_fprintf (f, "\tmov\t%r, %r\n", LAST_ARG_REGNUM, IP_REGNUM); + } + + if (eh_ofs) + asm_fprintf (f, "\tadd\t%r, %r\n", SP_REGNUM, REGNO (eh_ofs)); + + /* Return to caller. */ + asm_fprintf (f, "\tbx\t%r\n", reg_containing_return_addr); +} + +/* Emit code to push or pop registers to or from the stack. */ +static void +thumb_pushpop (f, mask, push) + FILE * f; + int mask; + int push; +{ + int regno; + int lo_mask = mask & 0xFF; + + if (lo_mask == 0 && ! push && (mask & (1 << 15))) + { + /* Special case. Do not generate a POP PC statement here, do it in + thumb_exit() */ + thumb_exit (f, -1, NULL_RTX); + return; + } + + fprintf (f, "\t%s\t{", push ? "push" : "pop"); + + /* Look at the low registers first. */ + for (regno = 0; regno <= LAST_LO_REGNUM; regno ++, lo_mask >>= 1) + { + if (lo_mask & 1) + { + asm_fprintf (f, "%r", regno); + + if ((lo_mask & ~1) != 0) + fprintf (f, ", "); + } + } + + if (push && (mask & (1 << LR_REGNUM))) + { + /* Catch pushing the LR. */ + if (mask & 0xFF) + fprintf (f, ", "); + + asm_fprintf (f, "%r", LR_REGNUM); + } + else if (!push && (mask & (1 << PC_REGNUM))) + { + /* Catch popping the PC. */ + if (TARGET_INTERWORK || TARGET_BACKTRACE) + { + /* The PC is never poped directly, instead + it is popped into r3 and then BX is used. */ + fprintf (f, "}\n"); + + thumb_exit (f, -1, NULL_RTX); + + return; + } + else + { + if (mask & 0xFF) + fprintf (f, ", "); + + asm_fprintf (f, "%r", PC_REGNUM); + } + } + + fprintf (f, "}\n"); +} + +void +thumb_final_prescan_insn (insn) + rtx insn; +{ + extern int * insn_addresses; + + if (flag_print_asm_name) + asm_fprintf (asm_out_file, "%@ 0x%04x\n", insn_addresses[INSN_UID (insn)]); +} + +int +thumb_shiftable_const (val) + unsigned HOST_WIDE_INT val; +{ + unsigned HOST_WIDE_INT mask = 0xff; + int i; + + if (val == 0) /* XXX */ + return 0; + + for (i = 0; i < 25; i++) + if ((val & (mask << i)) == val) + return 1; + + return 0; +} + +/* Returns non-zero if the current function contains, + or might contain a far jump. */ +int +thumb_far_jump_used_p (int in_prologue) +{ + rtx insn; + + /* This test is only important for leaf functions. */ + /* assert (! leaf_function_p ()); */ + + /* If we have already decided that far jumps may be used, + do not bother checking again, and always return true even if + it turns out that they are not being used. Once we have made + the decision that far jumps are present (and that hence the link + register will be pushed onto the stack) we cannot go back on it. */ + if (cfun->machine->far_jump_used) + return 1; + + /* If this function is not being called from the prologue/epilogue + generation code then it must be being called from the + INITIAL_ELIMINATION_OFFSET macro. */ + if (! in_prologue) + { + /* In this case we know that we are being asked about the elimination + of the arg pointer register. If that register is not being used, + then there are no arguments on the stack, and we do not have to + worry that a far jump might force the prologue to push the link + register, changing the stack offsets. In this case we can just + return false, since the presence of far jumps in the function will + not affect stack offsets. + + If the arg pointer is live (or if it was live, but has now been + eliminated and so set to dead) then we do have to test to see if + the function might contain a far jump. This test can lead to some + false negatives, since before reload is completed, then length of + branch instructions is not known, so gcc defaults to returning their + longest length, which in turn sets the far jump attribute to true. + + A false negative will not result in bad code being generated, but it + will result in a needless push and pop of the link register. We + hope that this does not occur too often. */ + if (regs_ever_live [ARG_POINTER_REGNUM]) + cfun->machine->arg_pointer_live = 1; + else if (! cfun->machine->arg_pointer_live) + return 0; + } + + /* Check to see if the function contains a branch + insn with the far jump attribute set. */ + for (insn = get_insns (); insn; insn = NEXT_INSN (insn)) + { + if (GET_CODE (insn) == JUMP_INSN + /* Ignore tablejump patterns. */ + && GET_CODE (PATTERN (insn)) != ADDR_VEC + && GET_CODE (PATTERN (insn)) != ADDR_DIFF_VEC + && get_attr_far_jump (insn) == FAR_JUMP_YES + ) + { + /* Record the fact that we have decied that + the function does use far jumps. */ + cfun->machine->far_jump_used = 1; + return 1; + } + } + + return 0; +} + +/* Return non-zero if FUNC must be entered in ARM mode. */ +int +is_called_in_ARM_mode (func) + tree func; +{ + if (TREE_CODE (func) != FUNCTION_DECL) + abort (); + + /* Ignore the problem about functions whoes address is taken. */ + if (TARGET_CALLEE_INTERWORKING && TREE_PUBLIC (func)) + return TRUE; + +#ifdef ARM_PE + return lookup_attribute ("interfacearm", DECL_MACHINE_ATTRIBUTES (func)) != NULL_TREE; +#else + return FALSE; +#endif +} + +/* The bits which aren't usefully expanded as rtl. */ +char * +thumb_unexpanded_epilogue () +{ + int regno; + int live_regs_mask = 0; + int high_regs_pushed = 0; + int leaf_function = leaf_function_p (); + int had_to_push_lr; + rtx eh_ofs = cfun->machine->eh_epilogue_sp_ofs; + + if (return_used_this_function) + return ""; + + for (regno = 0; regno <= LAST_LO_REGNUM; regno++) + if (regs_ever_live[regno] && ! call_used_regs[regno] + && ! (TARGET_SINGLE_PIC_BASE && (regno == arm_pic_register))) + live_regs_mask |= 1 << regno; + + for (regno = 8; regno < 13; regno++) + { + if (regs_ever_live[regno] && ! call_used_regs[regno] + && ! (TARGET_SINGLE_PIC_BASE && (regno == arm_pic_register))) + high_regs_pushed ++; + } + + /* The prolog may have pushed some high registers to use as + work registers. eg the testuite file: + gcc/testsuite/gcc/gcc.c-torture/execute/complex-2.c + compiles to produce: + push {r4, r5, r6, r7, lr} + mov r7, r9 + mov r6, r8 + push {r6, r7} + as part of the prolog. We have to undo that pushing here. */ + + if (high_regs_pushed) + { + int mask = live_regs_mask; + int next_hi_reg; + int size; + int mode; + +#ifdef RTX_CODE + /* If we can deduce the registers used from the function's return value. + This is more reliable that examining regs_ever_live[] because that + will be set if the register is ever used in the function, not just if + the register is used to hold a return value. */ + + if (current_function_return_rtx != 0) + mode = GET_MODE (current_function_return_rtx); + else +#endif + mode = DECL_MODE (DECL_RESULT (current_function_decl)); + + size = GET_MODE_SIZE (mode); + + /* Unless we are returning a type of size > 12 register r3 is + available. */ + if (size < 13) + mask |= 1 << 3; + + if (mask == 0) + /* Oh dear! We have no low registers into which we can pop + high registers! */ + fatal ("No low registers available for popping high registers"); + + for (next_hi_reg = 8; next_hi_reg < 13; next_hi_reg++) + if (regs_ever_live[next_hi_reg] && ! call_used_regs[next_hi_reg] + && ! (TARGET_SINGLE_PIC_BASE && (next_hi_reg == arm_pic_register))) + break; + + while (high_regs_pushed) + { + /* Find lo register(s) into which the high register(s) can + be popped. */ + for (regno = 0; regno <= LAST_LO_REGNUM; regno++) + { + if (mask & (1 << regno)) + high_regs_pushed--; + if (high_regs_pushed == 0) + break; + } + + mask &= (2 << regno) - 1; /* A noop if regno == 8 */ + + /* Pop the values into the low register(s). */ + thumb_pushpop (asm_out_file, mask, 0); + + /* Move the value(s) into the high registers. */ + for (regno = 0; regno <= LAST_LO_REGNUM; regno++) + { + if (mask & (1 << regno)) + { + asm_fprintf (asm_out_file, "\tmov\t%r, %r\n", next_hi_reg, + regno); + + for (next_hi_reg++; next_hi_reg < 13; next_hi_reg++) + if (regs_ever_live[next_hi_reg] && + ! call_used_regs[next_hi_reg] + && ! (TARGET_SINGLE_PIC_BASE + && (next_hi_reg == arm_pic_register))) + break; + } + } + } + } + + had_to_push_lr = (live_regs_mask || ! leaf_function + || thumb_far_jump_used_p (1)); + + if (TARGET_BACKTRACE + && ((live_regs_mask & 0xFF) == 0) + && regs_ever_live [LAST_ARG_REGNUM] != 0) + { + /* The stack backtrace structure creation code had to + push R7 in order to get a work register, so we pop + it now. */ + live_regs_mask |= (1 << LAST_LO_REGNUM); + } + + if (current_function_pretend_args_size == 0 || TARGET_BACKTRACE) + { + if (had_to_push_lr + && ! is_called_in_ARM_mode (current_function_decl) + && ! eh_ofs) + live_regs_mask |= 1 << PC_REGNUM; + + /* Either no argument registers were pushed or a backtrace + structure was created which includes an adjusted stack + pointer, so just pop everything. */ + if (live_regs_mask) + thumb_pushpop (asm_out_file, live_regs_mask, FALSE); + + if (eh_ofs) + thumb_exit (asm_out_file, 2, eh_ofs); + /* We have either just popped the return address into the + PC or it is was kept in LR for the entire function or + it is still on the stack because we do not want to + return by doing a pop {pc}. */ + else if ((live_regs_mask & (1 << PC_REGNUM)) == 0) + thumb_exit (asm_out_file, + (had_to_push_lr + && is_called_in_ARM_mode (current_function_decl)) ? + -1 : LR_REGNUM, NULL_RTX); + } + else + { + /* Pop everything but the return address. */ + live_regs_mask &= ~ (1 << PC_REGNUM); + + if (live_regs_mask) + thumb_pushpop (asm_out_file, live_regs_mask, FALSE); + + if (had_to_push_lr) + /* Get the return address into a temporary register. */ + thumb_pushpop (asm_out_file, 1 << LAST_ARG_REGNUM, 0); + + /* Remove the argument registers that were pushed onto the stack. */ + asm_fprintf (asm_out_file, "\tadd\t%r, %r, #%d\n", + SP_REGNUM, SP_REGNUM, + current_function_pretend_args_size); + + if (eh_ofs) + thumb_exit (asm_out_file, 2, eh_ofs); + else + thumb_exit (asm_out_file, + had_to_push_lr ? LAST_ARG_REGNUM : LR_REGNUM, NULL_RTX); + } + + return ""; +} + +/* Functions to save and restore machine-specific function data. */ + +static void +arm_mark_machine_status (p) + struct function * p; +{ + struct machine_function *machine = p->machine; + + ggc_mark_rtx (machine->ra_rtx); + ggc_mark_rtx (machine->eh_epilogue_sp_ofs); +} + +static void +arm_init_machine_status (p) + struct function * p; +{ + p->machine = + (struct machine_function *) xcalloc (1, sizeof (struct machine_function)); +} + +/* Return an RTX indicating where the return address to the + calling function can be found. */ +rtx +arm_return_addr (count, frame) + int count; + rtx frame ATTRIBUTE_UNUSED; +{ + rtx reg; + + if (count != 0) + return NULL_RTX; + + reg = cfun->machine->ra_rtx; + + if (reg == NULL) + { + rtx init; + + /* No rtx yet. Invent one, and initialize it for r14 (lr) in + the prologue. */ + reg = gen_reg_rtx (Pmode); + cfun->machine->ra_rtx = reg; + + if (! TARGET_APCS_32) + init = gen_rtx_AND (Pmode, gen_rtx_REG (Pmode, LR_REGNUM), + GEN_INT (RETURN_ADDR_MASK26)); + else + init = gen_rtx_REG (Pmode, LR_REGNUM); + + init = gen_rtx_SET (VOIDmode, reg, init); + + /* Emit the insn to the prologue with the other argument copies. */ + push_topmost_sequence (); + emit_insn_after (init, get_insns ()); + pop_topmost_sequence (); + } + + return reg; +} + +/* Do anything needed before RTL is emitted for each function. */ +void +arm_init_expanders () +{ + /* Arrange to initialize and mark the machine per-function status. */ + init_machine_status = arm_init_machine_status; + mark_machine_status = arm_mark_machine_status; +} + +/* Generate the rest of a function's prologue. */ +void +thumb_expand_prologue () +{ + HOST_WIDE_INT amount = (get_frame_size () + + current_function_outgoing_args_size); + + /* Naked functions don't have prologues. */ + if (arm_naked_function_p (current_function_decl)) + return; + + if (frame_pointer_needed) + emit_insn (gen_movsi (hard_frame_pointer_rtx, stack_pointer_rtx)); + + if (amount) + { + amount = ROUND_UP (amount); + + if (amount < 512) + emit_insn (gen_addsi3 (stack_pointer_rtx, stack_pointer_rtx, + GEN_INT (- amount))); + else + { + int regno; + rtx reg; + + /* The stack decrement is too big for an immediate value in a single + insn. In theory we could issue multiple subtracts, but after + three of them it becomes more space efficient to place the full + value in the constant pool and load into a register. (Also the + ARM debugger really likes to see only one stack decrement per + function). So instead we look for a scratch register into which + we can load the decrement, and then we subtract this from the + stack pointer. Unfortunately on the thumb the only available + scratch registers are the argument registers, and we cannot use + these as they may hold arguments to the function. Instead we + attempt to locate a call preserved register which is used by this + function. If we can find one, then we know that it will have + been pushed at the start of the prologue and so we can corrupt + it now. */ + for (regno = LAST_ARG_REGNUM + 1; regno <= LAST_LO_REGNUM; regno++) + if (regs_ever_live[regno] + && ! call_used_regs[regno] /* Paranoia */ + && ! (TARGET_SINGLE_PIC_BASE && (regno == arm_pic_register)) + && ! (frame_pointer_needed + && (regno == THUMB_HARD_FRAME_POINTER_REGNUM))) + break; + + if (regno > LAST_LO_REGNUM) /* Very unlikely */ + { + rtx spare = gen_rtx (REG, SImode, IP_REGNUM); + + /* Choose an arbitary, non-argument low register. */ + reg = gen_rtx (REG, SImode, LAST_LO_REGNUM); + + /* Save it by copying it into a high, scratch register. */ + emit_insn (gen_movsi (spare, reg)); + + /* Decrement the stack. */ + emit_insn (gen_movsi (reg, GEN_INT (- amount))); + emit_insn (gen_addsi3 (stack_pointer_rtx, stack_pointer_rtx, + reg)); + + /* Restore the low register's original value. */ + emit_insn (gen_movsi (reg, spare)); + + /* Emit a USE of the restored scratch register, so that flow + analysis will not consider the restore redundant. The + register won't be used again in this function and isn't + restored by the epilogue. */ + emit_insn (gen_rtx_USE (VOIDmode, reg)); + } + else + { + reg = gen_rtx (REG, SImode, regno); + + emit_insn (gen_movsi (reg, GEN_INT (- amount))); + emit_insn (gen_addsi3 (stack_pointer_rtx, stack_pointer_rtx, + reg)); + } + } + } + + if (profile_flag || profile_block_flag || TARGET_NO_SCHED_PRO) + emit_insn (gen_blockage ()); +} + +void +thumb_expand_epilogue () +{ + HOST_WIDE_INT amount = (get_frame_size () + + current_function_outgoing_args_size); + + /* Naked functions don't have epilogues. */ + if (arm_naked_function_p (current_function_decl)) + return; + + if (frame_pointer_needed) + emit_insn (gen_movsi (stack_pointer_rtx, hard_frame_pointer_rtx)); + else if (amount) + { + amount = ROUND_UP (amount); + + if (amount < 512) + emit_insn (gen_addsi3 (stack_pointer_rtx, stack_pointer_rtx, + GEN_INT (amount))); + else + { + /* r3 is always free in the epilogue. */ + rtx reg = gen_rtx (REG, SImode, LAST_ARG_REGNUM); + + emit_insn (gen_movsi (reg, GEN_INT (amount))); + emit_insn (gen_addsi3 (stack_pointer_rtx, stack_pointer_rtx, reg)); + } + } + + /* Emit a USE (stack_pointer_rtx), so that + the stack adjustment will not be deleted. */ + emit_insn (gen_rtx_USE (VOIDmode, stack_pointer_rtx)); + + if (profile_flag || profile_block_flag || TARGET_NO_SCHED_PRO) + emit_insn (gen_blockage ()); +} + +void +output_thumb_prologue (f) + FILE * f; +{ + int live_regs_mask = 0; + int high_regs_pushed = 0; + int store_arg_regs = 0; + int regno; + + if (arm_naked_function_p (current_function_decl)) + return; + + if (is_called_in_ARM_mode (current_function_decl)) + { + const char * name; + + if (GET_CODE (DECL_RTL (current_function_decl)) != MEM) + abort (); + if (GET_CODE (XEXP (DECL_RTL (current_function_decl), 0)) != SYMBOL_REF) + abort (); + name = XSTR (XEXP (DECL_RTL (current_function_decl), 0), 0); + + /* Generate code sequence to switch us into Thumb mode. */ + /* The .code 32 directive has already been emitted by + ASM_DECLARE_FUNCITON_NAME */ + asm_fprintf (f, "\torr\t%r, %r, #1\n", IP_REGNUM, PC_REGNUM); + asm_fprintf (f, "\tbx\t%r\n", IP_REGNUM); + + /* Generate a label, so that the debugger will notice the + change in instruction sets. This label is also used by + the assembler to bypass the ARM code when this function + is called from a Thumb encoded function elsewhere in the + same file. Hence the definition of STUB_NAME here must + agree with the definition in gas/config/tc-arm.c */ + +#define STUB_NAME ".real_start_of" + + asm_fprintf (f, "\t.code\t16\n"); +#ifdef ARM_PE + if (arm_dllexport_name_p (name)) + name = ARM_STRIP_NAME_ENCODING (name); +#endif + asm_fprintf (f, "\t.globl %s%U%s\n", STUB_NAME, name); + asm_fprintf (f, "\t.thumb_func\n"); + asm_fprintf (f, "%s%U%s:\n", STUB_NAME, name); + } + + if (current_function_anonymous_args && current_function_pretend_args_size) + store_arg_regs = 1; + + if (current_function_pretend_args_size) + { + if (store_arg_regs) + { + int num_pushes; + + asm_fprintf (f, "\tpush\t{"); + + num_pushes = NUM_INTS (current_function_pretend_args_size); + + for (regno = LAST_ARG_REGNUM + 1 - num_pushes; + regno <= LAST_ARG_REGNUM; + regno ++) + asm_fprintf (f, "%r%s", regno, + regno == LAST_ARG_REGNUM ? "" : ", "); + + asm_fprintf (f, "}\n"); + } + else + asm_fprintf (f, "\tsub\t%r, %r, #%d\n", + SP_REGNUM, SP_REGNUM, + current_function_pretend_args_size); + } + + for (regno = 0; regno <= LAST_LO_REGNUM; regno ++) + if (regs_ever_live[regno] && ! call_used_regs[regno] + && ! (TARGET_SINGLE_PIC_BASE && (regno == arm_pic_register))) + live_regs_mask |= 1 << regno; + + if (live_regs_mask || ! leaf_function_p () || thumb_far_jump_used_p (1)) + live_regs_mask |= 1 << LR_REGNUM; + + if (TARGET_BACKTRACE) + { + int offset; + int work_register = 0; + int wr; + + /* We have been asked to create a stack backtrace structure. + The code looks like this: + + 0 .align 2 + 0 func: + 0 sub SP, #16 Reserve space for 4 registers. + 2 push {R7} Get a work register. + 4 add R7, SP, #20 Get the stack pointer before the push. + 6 str R7, [SP, #8] Store the stack pointer (before reserving the space). + 8 mov R7, PC Get hold of the start of this code plus 12. + 10 str R7, [SP, #16] Store it. + 12 mov R7, FP Get hold of the current frame pointer. + 14 str R7, [SP, #4] Store it. + 16 mov R7, LR Get hold of the current return address. + 18 str R7, [SP, #12] Store it. + 20 add R7, SP, #16 Point at the start of the backtrace structure. + 22 mov FP, R7 Put this value into the frame pointer. */ + + if ((live_regs_mask & 0xFF) == 0) + { + /* See if the a4 register is free. */ + + if (regs_ever_live [LAST_ARG_REGNUM] == 0) + work_register = LAST_ARG_REGNUM; + else /* We must push a register of our own */ + live_regs_mask |= (1 << LAST_LO_REGNUM); + } + + if (work_register == 0) + { + /* Select a register from the list that will be pushed to + use as our work register. */ + for (work_register = (LAST_LO_REGNUM + 1); work_register--;) + if ((1 << work_register) & live_regs_mask) + break; + } + + asm_fprintf + (f, "\tsub\t%r, %r, #16\t%@ Create stack backtrace structure\n", + SP_REGNUM, SP_REGNUM); + + if (live_regs_mask) + thumb_pushpop (f, live_regs_mask, 1); + + for (offset = 0, wr = 1 << 15; wr != 0; wr >>= 1) + if (wr & live_regs_mask) + offset += 4; + + asm_fprintf (f, "\tadd\t%r, %r, #%d\n", work_register, SP_REGNUM, + offset + 16 + current_function_pretend_args_size); + + asm_fprintf (f, "\tstr\t%r, [%r, #%d]\n", work_register, SP_REGNUM, + offset + 4); + + /* Make sure that the instruction fetching the PC is in the right place + to calculate "start of backtrace creation code + 12". */ + if (live_regs_mask) + { + asm_fprintf (f, "\tmov\t%r, %r\n", work_register, PC_REGNUM); + asm_fprintf (f, "\tstr\t%r, [%r, #%d]\n", work_register, SP_REGNUM, + offset + 12); + asm_fprintf (f, "\tmov\t%r, %r\n", work_register, + ARM_HARD_FRAME_POINTER_REGNUM); + asm_fprintf (f, "\tstr\t%r, [%r, #%d]\n", work_register, SP_REGNUM, + offset); + } + else + { + asm_fprintf (f, "\tmov\t%r, %r\n", work_register, + ARM_HARD_FRAME_POINTER_REGNUM); + asm_fprintf (f, "\tstr\t%r, [%r, #%d]\n", work_register, SP_REGNUM, + offset); + asm_fprintf (f, "\tmov\t%r, %r\n", work_register, PC_REGNUM); + asm_fprintf (f, "\tstr\t%r, [%r, #%d]\n", work_register, SP_REGNUM, + offset + 12); + } + + asm_fprintf (f, "\tmov\t%r, %r\n", work_register, LR_REGNUM); + asm_fprintf (f, "\tstr\t%r, [%r, #%d]\n", work_register, SP_REGNUM, + offset + 8); + asm_fprintf (f, "\tadd\t%r, %r, #%d\n", work_register, SP_REGNUM, + offset + 12); + asm_fprintf (f, "\tmov\t%r, %r\t\t%@ Backtrace structure created\n", + ARM_HARD_FRAME_POINTER_REGNUM, work_register); + } + else if (live_regs_mask) + thumb_pushpop (f, live_regs_mask, 1); + + for (regno = 8; regno < 13; regno++) + { + if (regs_ever_live[regno] && ! call_used_regs[regno] + && ! (TARGET_SINGLE_PIC_BASE && (regno == arm_pic_register))) + high_regs_pushed ++; + } + + if (high_regs_pushed) + { + int pushable_regs = 0; + int mask = live_regs_mask & 0xff; + int next_hi_reg; + + for (next_hi_reg = 12; next_hi_reg > LAST_LO_REGNUM; next_hi_reg--) + { + if (regs_ever_live[next_hi_reg] && ! call_used_regs[next_hi_reg] + && ! (TARGET_SINGLE_PIC_BASE + && (next_hi_reg == arm_pic_register))) + break; + } + + pushable_regs = mask; + + if (pushable_regs == 0) + { + /* Desperation time -- this probably will never happen. */ + if (regs_ever_live[LAST_ARG_REGNUM] + || ! call_used_regs[LAST_ARG_REGNUM]) + asm_fprintf (f, "\tmov\t%r, %r\n", IP_REGNUM, LAST_ARG_REGNUM); + mask = 1 << LAST_ARG_REGNUM; + } + + while (high_regs_pushed > 0) + { + for (regno = LAST_LO_REGNUM; regno >= 0; regno--) + { + if (mask & (1 << regno)) + { + asm_fprintf (f, "\tmov\t%r, %r\n", regno, next_hi_reg); + + high_regs_pushed --; + + if (high_regs_pushed) + for (next_hi_reg--; next_hi_reg > LAST_LO_REGNUM; + next_hi_reg--) + { + if (regs_ever_live[next_hi_reg] + && ! call_used_regs[next_hi_reg] + && ! (TARGET_SINGLE_PIC_BASE + && (next_hi_reg == arm_pic_register))) + break; + } + else + { + mask &= ~ ((1 << regno) - 1); + break; + } + } + } + + thumb_pushpop (f, mask, 1); + } + + if (pushable_regs == 0 + && (regs_ever_live[LAST_ARG_REGNUM] + || ! call_used_regs[LAST_ARG_REGNUM])) + asm_fprintf (f, "\tmov\t%r, %r\n", LAST_ARG_REGNUM, IP_REGNUM); + } +} + +/* Handle the case of a double word load into a low register from + a computed memory address. The computed address may involve a + register which is overwritten by the load. */ + +char * +thumb_load_double_from_address (operands) + rtx * operands; +{ + rtx addr; + rtx base; + rtx offset; + rtx arg1; + rtx arg2; + + if (GET_CODE (operands[0]) != REG) + fatal ("thumb_load_double_from_address: destination is not a register"); + + if (GET_CODE (operands[1]) != MEM) + { + debug_rtx (operands[1]); + fatal ("thumb_load_double_from_address: source is not a computed memory address"); + } + + /* Get the memory address. */ + addr = XEXP (operands[1], 0); + + /* Work out how the memory address is computed. */ + switch (GET_CODE (addr)) + { + case REG: + operands[2] = gen_rtx (MEM, SImode, + plus_constant (XEXP (operands[1], 0), 4)); + + if (REGNO (operands[0]) == REGNO (addr)) + { + output_asm_insn ("ldr\t%H0, %2", operands); + output_asm_insn ("ldr\t%0, %1", operands); + } + else + { + output_asm_insn ("ldr\t%0, %1", operands); + output_asm_insn ("ldr\t%H0, %2", operands); + } + break; + + case CONST: + /* Compute <address> + 4 for the high order load. */ + operands[2] = gen_rtx (MEM, SImode, + plus_constant (XEXP (operands[1], 0), 4)); + + output_asm_insn ("ldr\t%0, %1", operands); + output_asm_insn ("ldr\t%H0, %2", operands); + break; + + case PLUS: + arg1 = XEXP (addr, 0); + arg2 = XEXP (addr, 1); + + if (CONSTANT_P (arg1)) + base = arg2, offset = arg1; + else + base = arg1, offset = arg2; + + if (GET_CODE (base) != REG) + fatal ("thumb_load_double_from_address: base is not a register"); + + /* Catch the case of <address> = <reg> + <reg> */ + if (GET_CODE (offset) == REG) + { + int reg_offset = REGNO (offset); + int reg_base = REGNO (base); + int reg_dest = REGNO (operands[0]); + + /* Add the base and offset registers together into the + higher destination register. */ + asm_fprintf (asm_out_file, "\tadd\t%r, %r, %r", + reg_dest + 1, reg_base, reg_offset); + + /* Load the lower destination register from the address in + the higher destination register. */ + asm_fprintf (asm_out_file, "\tldr\t%r, [%r, #0]", + reg_dest, reg_dest + 1); + + /* Load the higher destination register from its own address + plus 4. */ + asm_fprintf (asm_out_file, "\tldr\t%r, [%r, #4]", + reg_dest + 1, reg_dest + 1); + } + else + { + /* Compute <address> + 4 for the high order load. */ + operands[2] = gen_rtx (MEM, SImode, + plus_constant (XEXP (operands[1], 0), 4)); + + /* If the computed address is held in the low order register + then load the high order register first, otherwise always + load the low order register first. */ + if (REGNO (operands[0]) == REGNO (base)) + { + output_asm_insn ("ldr\t%H0, %2", operands); + output_asm_insn ("ldr\t%0, %1", operands); + } + else + { + output_asm_insn ("ldr\t%0, %1", operands); + output_asm_insn ("ldr\t%H0, %2", operands); + } + } + break; + + case LABEL_REF: + /* With no registers to worry about we can just load the value + directly. */ + operands[2] = gen_rtx (MEM, SImode, + plus_constant (XEXP (operands[1], 0), 4)); + + output_asm_insn ("ldr\t%H0, %2", operands); + output_asm_insn ("ldr\t%0, %1", operands); + break; + + default: + debug_rtx (operands[1]); + fatal ("thumb_load_double_from_address: Unhandled address calculation"); + break; + } + + return ""; +} + + +char * +thumb_output_move_mem_multiple (n, operands) + int n; + rtx * operands; +{ + rtx tmp; + + switch (n) + { + case 2: + if (REGNO (operands[2]) > REGNO (operands[3])) + { + tmp = operands[2]; + operands[2] = operands[3]; + operands[3] = tmp; + } + output_asm_insn ("ldmia\t%1!, {%2, %3}", operands); + output_asm_insn ("stmia\t%0!, {%2, %3}", operands); + break; + + case 3: + if (REGNO (operands[2]) > REGNO (operands[3])) + { + tmp = operands[2]; + operands[2] = operands[3]; + operands[3] = tmp; + } + if (REGNO (operands[3]) > REGNO (operands[4])) + { + tmp = operands[3]; + operands[3] = operands[4]; + operands[4] = tmp; + } + if (REGNO (operands[2]) > REGNO (operands[3])) + { + tmp = operands[2]; + operands[2] = operands[3]; + operands[3] = tmp; + } + + output_asm_insn ("ldmia\t%1!, {%2, %3, %4}", operands); + output_asm_insn ("stmia\t%0!, {%2, %3, %4}", operands); + break; + + default: + abort (); + } + + return ""; +} + +/* Routines for generating rtl */ + +void +thumb_expand_movstrqi (operands) + rtx * operands; +{ + rtx out = copy_to_mode_reg (SImode, XEXP (operands[0], 0)); + rtx in = copy_to_mode_reg (SImode, XEXP (operands[1], 0)); + HOST_WIDE_INT len = INTVAL (operands[2]); + HOST_WIDE_INT offset = 0; + + while (len >= 12) + { + emit_insn (gen_movmem12b (out, in)); + len -= 12; + } + + if (len >= 8) + { + emit_insn (gen_movmem8b (out, in)); + len -= 8; + } + + if (len >= 4) + { + rtx reg = gen_reg_rtx (SImode); + emit_insn (gen_movsi (reg, gen_rtx (MEM, SImode, in))); + emit_insn (gen_movsi (gen_rtx (MEM, SImode, out), reg)); + len -= 4; + offset += 4; + } + + if (len >= 2) + { + rtx reg = gen_reg_rtx (HImode); + emit_insn (gen_movhi (reg, gen_rtx (MEM, HImode, + plus_constant (in, offset)))); + emit_insn (gen_movhi (gen_rtx (MEM, HImode, plus_constant (out, offset)), + reg)); + len -= 2; + offset += 2; + } + + if (len) + { + rtx reg = gen_reg_rtx (QImode); + emit_insn (gen_movqi (reg, gen_rtx (MEM, QImode, + plus_constant (in, offset)))); + emit_insn (gen_movqi (gen_rtx (MEM, QImode, plus_constant (out, offset)), + reg)); + } +} + +int +thumb_cmp_operand (op, mode) + rtx op; + enum machine_mode mode; +{ + return ((GET_CODE (op) == CONST_INT + && (unsigned HOST_WIDE_INT) (INTVAL (op)) < 256) + || register_operand (op, mode)); +} + +static char * +thumb_condition_code (x, invert) + rtx x; + int invert; +{ + static char * conds[] = + { + "eq", "ne", "cs", "cc", "mi", "pl", "vs", "vc", + "hi", "ls", "ge", "lt", "gt", "le" + }; + int val; + + switch (GET_CODE (x)) + { + case EQ: val = 0; break; + case NE: val = 1; break; + case GEU: val = 2; break; + case LTU: val = 3; break; + case GTU: val = 8; break; + case LEU: val = 9; break; + case GE: val = 10; break; + case LT: val = 11; break; + case GT: val = 12; break; + case LE: val = 13; break; + default: + abort (); + } + + return conds[val ^ invert]; +} + +/* Handle storing a half-word to memory during reload. */ +void +thumb_reload_out_hi (operands) + rtx * operands; +{ + emit_insn (gen_thumb_movhi_clobber (operands[0], operands[1], operands[2])); +} + +/* Handle storing a half-word to memory during reload. */ +void +thumb_reload_in_hi (operands) + rtx * operands ATTRIBUTE_UNUSED; +{ + abort (); +} + /* Return the length of a function name prefix that starts with the character 'c'. */ static int @@ -7194,7 +9756,7 @@ aof_pic_entry (x) /* We mark this here and not in arm_add_gc_roots() to avoid polluting even more code with ifdefs, and because it never contains anything useful until we assign to it here. */ - ggc_add_rtx_root (&aof_pic_label, 1); + ggc_add_rtx_root (& aof_pic_label, 1); /* This needs to persist throughout the compilation. */ end_temporary_allocation (); aof_pic_label = gen_rtx_SYMBOL_REF (Pmode, "x$adcons"); |