CbC/CbC_gcc: gcc/loop-unroll.c comparison

comparison gcc/loop-unroll.c @ 67:f6334be47118

update gcc from gcc-4.6-20100522 to gcc-4.6-20110318

author	nobuyasu <dimolto@cr.ie.u-ryukyu.ac.jp>
date	Tue, 22 Mar 2011 17:18:12 +0900
parents	b7f97abdc517
children	04ced10e8804

comparison

equal deleted inserted replaced

-:65488c3d617d
+:f6334be47118
 	  apply_opt_in_copies (opt_info, npeel, false, true);
 	  free_opt_info (opt_info);
 	}
 /* Remove the exit edges.  */
-for (i = 0; VEC_iterate (edge, remove_edges, i, ein); i++)
+FOR_EACH_VEC_ELT (edge, remove_edges, i, ein)
 	remove_path (ein);
 VEC_free (edge, heap, remove_edges);
 }
 ein = desc->in_edge;
 desc->niter /= max_unroll + 1;
 desc->niter_max /= max_unroll + 1;
 desc->niter_expr = GEN_INT (desc->niter);
 /* Remove the edges.  */
-for (i = 0; VEC_iterate (edge, remove_edges, i, e); i++)
+FOR_EACH_VEC_ELT (edge, remove_edges, i, e)
 remove_path (e);
 VEC_free (edge, heap, remove_edges);
 if (dump_file)
 fprintf (dump_file,
 /* ??? We used to assume that INSNS can contain control flow insns, and
 that we had to try to find sub basic blocks in BB to maintain a valid
 CFG.  For this purpose we used to set the BB_SUPERBLOCK flag on BB
 and call break_superblocks when going out of cfglayout mode.  But it
 turns out that this never happens; and that if it does ever happen,
-the verify_flow_info call in loop_optimizer_finalize would fail.
+the TODO_verify_flow at the end of the RTL loop passes would fail.
 There are two reasons why we expected we could have control flow insns
 in INSNS.  The first is when a comparison has to be done in parts, and
 the second is when the number of iterations is computed for loops with
 the number of iterations known at runtime.  In both cases, test cases
 {
 VEC (basic_block, heap) *ldom;
 basic_block bb;
 ldom = get_dominated_by (CDI_DOMINATORS, body[i]);
-for (j = 0; VEC_iterate (basic_block, ldom, j, bb); j++)
+FOR_EACH_VEC_ELT (basic_block, ldom, j, bb)
 	if (!flow_bb_inside_loop_p (loop, bb))
 	  VEC_safe_push (basic_block, heap, dom_bbs, bb);
 VEC_free (basic_block, heap, ldom);
 }
 	  desc->in_edge = EDGE_SUCC (exit_block, 0);
 	}
 }
 /* Remove the edges.  */
-for (i = 0; VEC_iterate (edge, remove_edges, i, e); i++)
+FOR_EACH_VEC_ELT (edge, remove_edges, i, e)
 remove_path (e);
 VEC_free (edge, heap, remove_edges);
 /* We must be careful when updating the number of iterations due to
 preconditioning and the fact that the value must be valid at entry
 */
 static struct var_to_expand *
 analyze_insn_to_expand_var (struct loop *loop, rtx insn)
 {
-rtx set, dest, src, op1, op2, something;
+rtx set, dest, src;
 struct var_to_expand *ves;
-enum machine_mode mode1, mode2;
 unsigned accum_pos;
+enum rtx_code code;
 int debug_uses = 0;
 set = single_set (insn);
 if (!set)
 return NULL;
 dest = SET_DEST (set);
 src = SET_SRC (set);
+code = GET_CODE (src);
-if (GET_CODE (src) != PLUS
-&& GET_CODE (src) != MINUS
+if (code != PLUS && code != MINUS && code != MULT && code != FMA)
-&& GET_CODE (src) != MULT)
 return NULL;
+if (FLOAT_MODE_P (GET_MODE (dest)))
+{
+if (!flag_associative_math)
+return NULL;
+/* In the case of FMA, we're also changing the rounding.  */
+if (code == FMA && !flag_unsafe_math_optimizations)
+	return NULL;
+}
 /* Hmm, this is a bit paradoxical.  We know that INSN is a valid insn
 in MD.  But if there is no optab to generate the insn, we can not
 perform the variable expansion.  This can happen if an MD provides
 an insn but not a named pattern to generate it, for example to avoid
 producing code that needs additional mode switches like for x87/mmx.
 So we check have_insn_for which looks for an optab for the operation
 in SRC.  If it doesn't exist, we can't perform the expansion even
 though INSN is valid.  */
-if (!have_insn_for (GET_CODE (src), GET_MODE (src)))
+if (!have_insn_for (code, GET_MODE (src)))
 return NULL;
-op1 = XEXP (src, 0);
-op2 = XEXP (src, 1);
 if (!REG_P (dest)
 && !(GET_CODE (dest) == SUBREG
 && REG_P (SUBREG_REG (dest))))
 return NULL;
-if (rtx_equal_p (dest, op1))
+/* Find the accumulator use within the operation.  */
+if (code == FMA)
+{
+/* We only support accumulation via FMA in the ADD position.  */
+if (!rtx_equal_p  (dest, XEXP (src, 2)))
+	return NULL;
+accum_pos = 2;
+}
+else if (rtx_equal_p (dest, XEXP (src, 0)))
 accum_pos = 0;
-else if (rtx_equal_p (dest, op2))
+else if (rtx_equal_p (dest, XEXP (src, 1)))
-accum_pos = 1;
+{
+/* The method of expansion that we are using, which includes the
+	 initialization of the expansions with zero and the summation of
+the expansions at the end of the computation, will yield wrong
+	 results for (x = something - x); thus avoid using it in that case.  */
+if (code == MINUS)
+	return NULL;
+accum_pos = 1;
+}
 else
 return NULL;
-/* The method of expansion that we are using; which includes
+/* It must not otherwise be used.  */
-the initialization of the expansions with zero and the summation of
+if (code == FMA)
-the expansions at the end of the computation will yield wrong results
+{
-for (x = something - x) thus avoid using it in that case.  */
+if (rtx_referenced_p (dest, XEXP (src, 0))
-if (accum_pos == 1
+	  || rtx_referenced_p (dest, XEXP (src, 1)))
-&& GET_CODE (src) == MINUS)
+	return NULL;
-return NULL;
+}
+else if (rtx_referenced_p (dest, XEXP (src, 1 - accum_pos)))
-something = (accum_pos == 0) ? op2 : op1;
-if (rtx_referenced_p (dest, something))
 return NULL;
+/* It must be used in exactly one insn.  */
 if (!referenced_in_one_insn_in_loop_p (loop, dest, &debug_uses))
 return NULL;
-mode1 = GET_MODE (dest);
-mode2 = GET_MODE (something);
-if ((FLOAT_MODE_P (mode1)
-|| FLOAT_MODE_P (mode2))
-&& !flag_associative_math)
-return NULL;
 if (dump_file)
 {
-fprintf (dump_file,
+fprintf (dump_file, "\n;; Expanding Accumulator ");
-"\n;; Expanding Accumulator ");
+print_rtl (dump_file, dest);
-print_rtl (dump_file, dest);
+fprintf (dump_file, "\n");
-fprintf (dump_file, "\n");
+}
-}
 if (debug_uses)
 /* Instead of resetting the debug insns, we could replace each
 debug use in the loop with the sum or product of all expanded
 accumulators.  Since we'll only know of all expansions at the
 if (VEC_length (rtx, ve->var_expansions) == 0)
 return;
 start_sequence ();
-if (ve->op == PLUS || ve->op == MINUS)
+switch (ve->op)
-for (i = 0; VEC_iterate (rtx, ve->var_expansions, i, var); i++)
+{
-{
+case FMA:
-	if (honor_signed_zero_p)
+/* Note that we only accumulate FMA via the ADD operand.  */
-	  zero_init = simplify_gen_unary (NEG, mode, CONST0_RTX (mode), mode);
+case PLUS:
-	else
+case MINUS:
-	  zero_init = CONST0_RTX (mode);
+FOR_EACH_VEC_ELT (rtx, ve->var_expansions, i, var)
+{
-emit_move_insn (var, zero_init);
+	  if (honor_signed_zero_p)
-}
+	    zero_init = simplify_gen_unary (NEG, mode, CONST0_RTX (mode), mode);
-else if (ve->op == MULT)
+	  else
-for (i = 0; VEC_iterate (rtx, ve->var_expansions, i, var); i++)
+	    zero_init = CONST0_RTX (mode);
-{
+emit_move_insn (var, zero_init);
-zero_init =  CONST1_RTX (GET_MODE (var));
+}
-emit_move_insn (var, zero_init);
+break;
-}
+case MULT:
+FOR_EACH_VEC_ELT (rtx, ve->var_expansions, i, var)
+{
+zero_init = CONST1_RTX (GET_MODE (var));
+emit_move_insn (var, zero_init);
+}
+break;
+default:
+gcc_unreachable ();
+}
 seq = get_insns ();
 end_sequence ();
 insn = BB_HEAD (place);
 if (VEC_length (rtx, ve->var_expansions) == 0)
 return;
 start_sequence ();
-if (ve->op == PLUS || ve->op == MINUS)
+switch (ve->op)
-for (i = 0; VEC_iterate (rtx, ve->var_expansions, i, var); i++)
+{
-{
+case FMA:
-sum = simplify_gen_binary (PLUS, GET_MODE (ve->reg),
+/* Note that we only accumulate FMA via the ADD operand.  */
-var, sum);
+case PLUS:
-}
+case MINUS:
-else if (ve->op == MULT)
+FOR_EACH_VEC_ELT (rtx, ve->var_expansions, i, var)
-for (i = 0; VEC_iterate (rtx, ve->var_expansions, i, var); i++)
+	sum = simplify_gen_binary (PLUS, GET_MODE (ve->reg), var, sum);
-{
+break;
-sum = simplify_gen_binary (MULT, GET_MODE (ve->reg),
-var, sum);
+case MULT:
-}
+FOR_EACH_VEC_ELT (rtx, ve->var_expansions, i, var)
+	sum = simplify_gen_binary (MULT, GET_MODE (ve->reg), var, sum);
+break;
+default:
+gcc_unreachable ();
+}
 expr = force_operand (sum, ve->reg);
 if (expr != ve->reg)
 emit_move_insn (ve->reg, expr);
 seq = get_insns ();

Mercurial > hg > CbC > CbC_gcc

comparison gcc/loop-unroll.c @ 67:f6334be47118