>+/* STRD in ARM mode needs consecutive registers to be stored. This function >+ keeps accumulating non-consecutive registers until first consecutive >register
numchar > 80. >+ pair is found. It then generates multi-reg PUSH for all accumulated >+ registers, and then generates STRD with write-back for consecutive register >+ pair. This process is repeated until all the registers are stored on >stack. And again. >+ multi-reg PUSH takes care of lone registers as well. */ s/multi-reg/Multi register >+static void >+arm_emit_strd_push (unsigned long saved_regs_mask) How different is this from the thumb2 version you sent out in Patch 03/05 ? >+{ >+ int num_regs = 0; >+ int i, j; >+ rtx par = NULL_RTX; >+ rtx dwarf = NULL_RTX; >+ rtx insn = NULL_RTX; >+ rtx tmp, tmp1; >+ unsigned long regs_to_be_pushed_mask; >+ >+ for (i = 0; i <= LAST_ARM_REGNUM; i++) >+ if (saved_regs_mask & (1 << i)) >+ num_regs++; >+ >+ gcc_assert (num_regs && num_regs <= 16); >+ >+ for (i=0, j = LAST_ARM_REGNUM, regs_to_be_pushed_mask = 0; i < num_regs; >j--) >+ /* Var j iterates over all registers to gather all registers in >+ saved_regs_mask. Var i is used to count number of registers stored on >+ stack. regs_to_be_pushed_mask accumulates non-consecutive registers >+ that can be pushed using multi-reg PUSH before STRD is generated. */ Comment above loop. <...snip...> >@@ -15958,7 +16081,8 @@ arm_get_frame_offsets (void) > use 32-bit push/pop instructions. */ > if (! any_sibcall_uses_r3 () > && arm_size_return_regs () <= 12 >- && (offsets->saved_regs_mask & (1 << 3)) == 0) >+ && (offsets->saved_regs_mask & (1 << 3)) == 0 >+ && (TARGET_THUMB2 || !current_tune->prefer_ldrd_strd)) Not sure I completely follow this change yet. >@@ -16427,9 +16551,12 @@ arm_expand_prologue (void) > } > } > >- if (TARGET_THUMB2 && current_tune->prefer_ldrd_strd && !optimize_size) >+ if (current_tune->prefer_ldrd_strd && !optimize_size) s/optimize_size/optimize_function_for_size () > { >- thumb2_emit_strd_push (live_regs_mask); >+ if (TARGET_THUMB2) >+ thumb2_emit_strd_push (live_regs_mask); >+ else >+ arm_emit_strd_push (live_regs_mask); > } > else > { >diff --git a/gcc/config/arm/ldmstm.md b/gcc/config/arm/ldmstm.md >index e3dcd4f..3c729bb 100644 >--- a/gcc/config/arm/ldmstm.md >+++ b/gcc/config/arm/ldmstm.md >@@ -73,6 +73,42 @@ > [(set_attr "type" "store2") > (set_attr "predicable" "yes")]) > >+(define_insn "*arm_strd_base" >+ [(set (match_operand:SI 0 "arm_hard_register_operand" "+rk") >+ (plus:SI (match_dup 0) >+ (const_int -8))) >+ (set (mem:SI (match_dup 0)) >+ (match_operand:SI 1 "arm_hard_register_operand" "r")) >+ (set (mem:SI (plus:SI (match_dup 0) >+ (const_int 4))) >+ (match_operand:SI 2 "arm_hard_register_operand" "r"))] >+ "(TARGET_ARM && current_tune->prefer_ldrd_strd >+ && (!bad_reg_pair_for_arm_ldrd_strd (operands[1], operands[2])) >+ && (REGNO (operands[1]) != REGNO (operands[0])) >+ && (REGNO (operands[2]) != REGNO (operands[0])))" >+ "str%(d%)\t%1, %2, [%0, #-8]!" >+ [(set_attr "type" "store2") >+ (set_attr "predicable" "yes")]) Hmmm the question remains if we want to put these into ldmstm.md since it was theoretically auto-generated from ldmstm.ml. If this has to be marked to be separate then I'd like to regenerate ldmstm.md from ldmstm.ml and differentiate between the bits that can be auto-generated and the bits that have been added since. Otherwise OK. Ramana