Mercurial > hg > CbC > CbC_gcc
annotate gcc/loop-iv.c @ 132:d34655255c78
update gcc-8.2
author | mir3636 |
---|---|
date | Thu, 25 Oct 2018 10:21:07 +0900 |
parents | 84e7813d76e9 |
children | 1830386684a0 |
rev | line source |
---|---|
0 | 1 /* Rtl-level induction variable analysis. |
131 | 2 Copyright (C) 2004-2018 Free Software Foundation, Inc. |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
3 |
0 | 4 This file is part of GCC. |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
5 |
0 | 6 GCC is free software; you can redistribute it and/or modify it |
7 under the terms of the GNU General Public License as published by the | |
8 Free Software Foundation; either version 3, or (at your option) any | |
9 later version. | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
10 |
0 | 11 GCC is distributed in the hope that it will be useful, but WITHOUT |
12 ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or | |
13 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License | |
14 for more details. | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
15 |
0 | 16 You should have received a copy of the GNU General Public License |
17 along with GCC; see the file COPYING3. If not see | |
18 <http://www.gnu.org/licenses/>. */ | |
19 | |
20 /* This is a simple analysis of induction variables of the loop. The major use | |
21 is for determining the number of iterations of a loop for loop unrolling, | |
22 doloop optimization and branch prediction. The iv information is computed | |
23 on demand. | |
24 | |
25 Induction variables are analyzed by walking the use-def chains. When | |
26 a basic induction variable (biv) is found, it is cached in the bivs | |
27 hash table. When register is proved to be a biv, its description | |
28 is stored to DF_REF_DATA of the def reference. | |
29 | |
30 The analysis works always with one loop -- you must call | |
31 iv_analysis_loop_init (loop) for it. All the other functions then work with | |
32 this loop. When you need to work with another loop, just call | |
33 iv_analysis_loop_init for it. When you no longer need iv analysis, call | |
34 iv_analysis_done () to clean up the memory. | |
35 | |
36 The available functions are: | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
37 |
111 | 38 iv_analyze (insn, mode, reg, iv): Stores the description of the induction |
39 variable corresponding to the use of register REG in INSN to IV, given | |
40 that REG has mode MODE. Returns true if REG is an induction variable | |
41 in INSN. false otherwise. If a use of REG is not found in INSN, | |
42 the following insns are scanned (so that we may call this function | |
43 on insns returned by get_condition). | |
0 | 44 iv_analyze_result (insn, def, iv): Stores to IV the description of the iv |
45 corresponding to DEF, which is a register defined in INSN. | |
111 | 46 iv_analyze_expr (insn, mode, expr, iv): Stores to IV the description of iv |
0 | 47 corresponding to expression EXPR evaluated at INSN. All registers used bu |
111 | 48 EXPR must also be used in INSN. MODE is the mode of EXPR. |
0 | 49 */ |
50 | |
51 #include "config.h" | |
52 #include "system.h" | |
53 #include "coretypes.h" | |
111 | 54 #include "backend.h" |
0 | 55 #include "rtl.h" |
111 | 56 #include "df.h" |
57 #include "memmodel.h" | |
58 #include "emit-rtl.h" | |
59 #include "diagnostic-core.h" | |
0 | 60 #include "cfgloop.h" |
61 #include "intl.h" | |
111 | 62 #include "dumpfile.h" |
63 #include "rtl-iter.h" | |
0 | 64 |
65 /* Possible return values of iv_get_reaching_def. */ | |
66 | |
67 enum iv_grd_result | |
68 { | |
69 /* More than one reaching def, or reaching def that does not | |
70 dominate the use. */ | |
71 GRD_INVALID, | |
72 | |
73 /* The use is trivial invariant of the loop, i.e. is not changed | |
74 inside the loop. */ | |
75 GRD_INVARIANT, | |
76 | |
77 /* The use is reached by initial value and a value from the | |
78 previous iteration. */ | |
79 GRD_MAYBE_BIV, | |
80 | |
81 /* The use has single dominating def. */ | |
82 GRD_SINGLE_DOM | |
83 }; | |
84 | |
85 /* Information about a biv. */ | |
86 | |
87 struct biv_entry | |
88 { | |
89 unsigned regno; /* The register of the biv. */ | |
90 struct rtx_iv iv; /* Value of the biv. */ | |
91 }; | |
92 | |
93 static bool clean_slate = true; | |
94 | |
95 static unsigned int iv_ref_table_size = 0; | |
96 | |
97 /* Table of rtx_ivs indexed by the df_ref uid field. */ | |
98 static struct rtx_iv ** iv_ref_table; | |
99 | |
100 /* Induction variable stored at the reference. */ | |
111 | 101 #define DF_REF_IV(REF) iv_ref_table[DF_REF_ID (REF)] |
102 #define DF_REF_IV_SET(REF, IV) iv_ref_table[DF_REF_ID (REF)] = (IV) | |
0 | 103 |
104 /* The current loop. */ | |
105 | |
106 static struct loop *current_loop; | |
107 | |
111 | 108 /* Hashtable helper. */ |
109 | |
110 struct biv_entry_hasher : free_ptr_hash <biv_entry> | |
111 { | |
112 typedef rtx_def *compare_type; | |
113 static inline hashval_t hash (const biv_entry *); | |
114 static inline bool equal (const biv_entry *, const rtx_def *); | |
115 }; | |
116 | |
117 /* Returns hash value for biv B. */ | |
118 | |
119 inline hashval_t | |
120 biv_entry_hasher::hash (const biv_entry *b) | |
121 { | |
122 return b->regno; | |
123 } | |
124 | |
125 /* Compares biv B and register R. */ | |
126 | |
127 inline bool | |
128 biv_entry_hasher::equal (const biv_entry *b, const rtx_def *r) | |
129 { | |
130 return b->regno == REGNO (r); | |
131 } | |
132 | |
0 | 133 /* Bivs of the current loop. */ |
134 | |
111 | 135 static hash_table<biv_entry_hasher> *bivs; |
136 | |
137 static bool iv_analyze_op (rtx_insn *, scalar_int_mode, rtx, struct rtx_iv *); | |
138 | |
139 /* Return the RTX code corresponding to the IV extend code EXTEND. */ | |
140 static inline enum rtx_code | |
141 iv_extend_to_rtx_code (enum iv_extend_code extend) | |
142 { | |
143 switch (extend) | |
144 { | |
145 case IV_SIGN_EXTEND: | |
146 return SIGN_EXTEND; | |
147 case IV_ZERO_EXTEND: | |
148 return ZERO_EXTEND; | |
149 case IV_UNKNOWN_EXTEND: | |
150 return UNKNOWN; | |
151 } | |
152 gcc_unreachable (); | |
153 } | |
0 | 154 |
155 /* Dumps information about IV to FILE. */ | |
156 | |
157 extern void dump_iv_info (FILE *, struct rtx_iv *); | |
158 void | |
159 dump_iv_info (FILE *file, struct rtx_iv *iv) | |
160 { | |
161 if (!iv->base) | |
162 { | |
163 fprintf (file, "not simple"); | |
164 return; | |
165 } | |
166 | |
167 if (iv->step == const0_rtx | |
168 && !iv->first_special) | |
169 fprintf (file, "invariant "); | |
170 | |
171 print_rtl (file, iv->base); | |
172 if (iv->step != const0_rtx) | |
173 { | |
174 fprintf (file, " + "); | |
175 print_rtl (file, iv->step); | |
176 fprintf (file, " * iteration"); | |
177 } | |
178 fprintf (file, " (in %s)", GET_MODE_NAME (iv->mode)); | |
179 | |
180 if (iv->mode != iv->extend_mode) | |
181 fprintf (file, " %s to %s", | |
111 | 182 rtx_name[iv_extend_to_rtx_code (iv->extend)], |
0 | 183 GET_MODE_NAME (iv->extend_mode)); |
184 | |
185 if (iv->mult != const1_rtx) | |
186 { | |
187 fprintf (file, " * "); | |
188 print_rtl (file, iv->mult); | |
189 } | |
190 if (iv->delta != const0_rtx) | |
191 { | |
192 fprintf (file, " + "); | |
193 print_rtl (file, iv->delta); | |
194 } | |
195 if (iv->first_special) | |
196 fprintf (file, " (first special)"); | |
197 } | |
198 | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
199 static void |
0 | 200 check_iv_ref_table_size (void) |
201 { | |
111 | 202 if (iv_ref_table_size < DF_DEFS_TABLE_SIZE ()) |
0 | 203 { |
204 unsigned int new_size = DF_DEFS_TABLE_SIZE () + (DF_DEFS_TABLE_SIZE () / 4); | |
205 iv_ref_table = XRESIZEVEC (struct rtx_iv *, iv_ref_table, new_size); | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
206 memset (&iv_ref_table[iv_ref_table_size], 0, |
0 | 207 (new_size - iv_ref_table_size) * sizeof (struct rtx_iv *)); |
208 iv_ref_table_size = new_size; | |
209 } | |
210 } | |
211 | |
212 | |
213 /* Checks whether REG is a well-behaved register. */ | |
214 | |
215 static bool | |
216 simple_reg_p (rtx reg) | |
217 { | |
218 unsigned r; | |
219 | |
220 if (GET_CODE (reg) == SUBREG) | |
221 { | |
222 if (!subreg_lowpart_p (reg)) | |
223 return false; | |
224 reg = SUBREG_REG (reg); | |
225 } | |
226 | |
227 if (!REG_P (reg)) | |
228 return false; | |
229 | |
230 r = REGNO (reg); | |
231 if (HARD_REGISTER_NUM_P (r)) | |
232 return false; | |
233 | |
234 if (GET_MODE_CLASS (GET_MODE (reg)) != MODE_INT) | |
235 return false; | |
236 | |
237 return true; | |
238 } | |
239 | |
240 /* Clears the information about ivs stored in df. */ | |
241 | |
242 static void | |
243 clear_iv_info (void) | |
244 { | |
245 unsigned i, n_defs = DF_DEFS_TABLE_SIZE (); | |
246 struct rtx_iv *iv; | |
247 | |
248 check_iv_ref_table_size (); | |
249 for (i = 0; i < n_defs; i++) | |
250 { | |
251 iv = iv_ref_table[i]; | |
252 if (iv) | |
253 { | |
254 free (iv); | |
255 iv_ref_table[i] = NULL; | |
256 } | |
257 } | |
258 | |
111 | 259 bivs->empty (); |
0 | 260 } |
261 | |
262 | |
263 /* Prepare the data for an induction variable analysis of a LOOP. */ | |
264 | |
265 void | |
266 iv_analysis_loop_init (struct loop *loop) | |
267 { | |
268 current_loop = loop; | |
269 | |
270 /* Clear the information from the analysis of the previous loop. */ | |
271 if (clean_slate) | |
272 { | |
273 df_set_flags (DF_EQ_NOTES + DF_DEFER_INSN_RESCAN); | |
111 | 274 bivs = new hash_table<biv_entry_hasher> (10); |
0 | 275 clean_slate = false; |
276 } | |
277 else | |
278 clear_iv_info (); | |
279 | |
280 /* Get rid of the ud chains before processing the rescans. Then add | |
281 the problem back. */ | |
282 df_remove_problem (df_chain); | |
283 df_process_deferred_rescans (); | |
111 | 284 df_set_flags (DF_RD_PRUNE_DEAD_DEFS); |
0 | 285 df_chain_add_problem (DF_UD_CHAIN); |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
286 df_note_add_problem (); |
111 | 287 df_analyze_loop (loop); |
0 | 288 if (dump_file) |
289 df_dump_region (dump_file); | |
290 | |
291 check_iv_ref_table_size (); | |
292 } | |
293 | |
294 /* Finds the definition of REG that dominates loop latch and stores | |
295 it to DEF. Returns false if there is not a single definition | |
296 dominating the latch. If REG has no definition in loop, DEF | |
297 is set to NULL and true is returned. */ | |
298 | |
299 static bool | |
300 latch_dominating_def (rtx reg, df_ref *def) | |
301 { | |
302 df_ref single_rd = NULL, adef; | |
303 unsigned regno = REGNO (reg); | |
304 struct df_rd_bb_info *bb_info = DF_RD_BB_INFO (current_loop->latch); | |
305 | |
306 for (adef = DF_REG_DEF_CHAIN (regno); adef; adef = DF_REF_NEXT_REG (adef)) | |
307 { | |
308 if (!bitmap_bit_p (df->blocks_to_analyze, DF_REF_BBNO (adef)) | |
67
f6334be47118
update gcc from gcc-4.6-20100522 to gcc-4.6-20110318
nobuyasu <dimolto@cr.ie.u-ryukyu.ac.jp>
parents:
55
diff
changeset
|
309 || !bitmap_bit_p (&bb_info->out, DF_REF_ID (adef))) |
0 | 310 continue; |
311 | |
312 /* More than one reaching definition. */ | |
313 if (single_rd) | |
314 return false; | |
315 | |
316 if (!just_once_each_iteration_p (current_loop, DF_REF_BB (adef))) | |
317 return false; | |
318 | |
319 single_rd = adef; | |
320 } | |
321 | |
322 *def = single_rd; | |
323 return true; | |
324 } | |
325 | |
326 /* Gets definition of REG reaching its use in INSN and stores it to DEF. */ | |
327 | |
328 static enum iv_grd_result | |
111 | 329 iv_get_reaching_def (rtx_insn *insn, rtx reg, df_ref *def) |
0 | 330 { |
331 df_ref use, adef; | |
332 basic_block def_bb, use_bb; | |
111 | 333 rtx_insn *def_insn; |
0 | 334 bool dom_p; |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
335 |
0 | 336 *def = NULL; |
337 if (!simple_reg_p (reg)) | |
338 return GRD_INVALID; | |
339 if (GET_CODE (reg) == SUBREG) | |
340 reg = SUBREG_REG (reg); | |
341 gcc_assert (REG_P (reg)); | |
342 | |
343 use = df_find_use (insn, reg); | |
344 gcc_assert (use != NULL); | |
345 | |
346 if (!DF_REF_CHAIN (use)) | |
347 return GRD_INVARIANT; | |
348 | |
349 /* More than one reaching def. */ | |
350 if (DF_REF_CHAIN (use)->next) | |
351 return GRD_INVALID; | |
352 | |
353 adef = DF_REF_CHAIN (use)->ref; | |
354 | |
355 /* We do not handle setting only part of the register. */ | |
356 if (DF_REF_FLAGS (adef) & DF_REF_READ_WRITE) | |
357 return GRD_INVALID; | |
358 | |
359 def_insn = DF_REF_INSN (adef); | |
360 def_bb = DF_REF_BB (adef); | |
361 use_bb = BLOCK_FOR_INSN (insn); | |
362 | |
363 if (use_bb == def_bb) | |
364 dom_p = (DF_INSN_LUID (def_insn) < DF_INSN_LUID (insn)); | |
365 else | |
366 dom_p = dominated_by_p (CDI_DOMINATORS, use_bb, def_bb); | |
367 | |
368 if (dom_p) | |
369 { | |
370 *def = adef; | |
371 return GRD_SINGLE_DOM; | |
372 } | |
373 | |
374 /* The definition does not dominate the use. This is still OK if | |
375 this may be a use of a biv, i.e. if the def_bb dominates loop | |
376 latch. */ | |
377 if (just_once_each_iteration_p (current_loop, def_bb)) | |
378 return GRD_MAYBE_BIV; | |
379 | |
380 return GRD_INVALID; | |
381 } | |
382 | |
383 /* Sets IV to invariant CST in MODE. Always returns true (just for | |
384 consistency with other iv manipulation functions that may fail). */ | |
385 | |
386 static bool | |
111 | 387 iv_constant (struct rtx_iv *iv, scalar_int_mode mode, rtx cst) |
0 | 388 { |
389 iv->mode = mode; | |
390 iv->base = cst; | |
391 iv->step = const0_rtx; | |
392 iv->first_special = false; | |
111 | 393 iv->extend = IV_UNKNOWN_EXTEND; |
0 | 394 iv->extend_mode = iv->mode; |
395 iv->delta = const0_rtx; | |
396 iv->mult = const1_rtx; | |
397 | |
398 return true; | |
399 } | |
400 | |
401 /* Evaluates application of subreg to MODE on IV. */ | |
402 | |
403 static bool | |
111 | 404 iv_subreg (struct rtx_iv *iv, scalar_int_mode mode) |
0 | 405 { |
406 /* If iv is invariant, just calculate the new value. */ | |
407 if (iv->step == const0_rtx | |
408 && !iv->first_special) | |
409 { | |
410 rtx val = get_iv_value (iv, const0_rtx); | |
111 | 411 val = lowpart_subreg (mode, val, |
412 iv->extend == IV_UNKNOWN_EXTEND | |
413 ? iv->mode : iv->extend_mode); | |
0 | 414 |
415 iv->base = val; | |
111 | 416 iv->extend = IV_UNKNOWN_EXTEND; |
0 | 417 iv->mode = iv->extend_mode = mode; |
418 iv->delta = const0_rtx; | |
419 iv->mult = const1_rtx; | |
420 return true; | |
421 } | |
422 | |
423 if (iv->extend_mode == mode) | |
424 return true; | |
425 | |
426 if (GET_MODE_BITSIZE (mode) > GET_MODE_BITSIZE (iv->mode)) | |
427 return false; | |
428 | |
111 | 429 iv->extend = IV_UNKNOWN_EXTEND; |
0 | 430 iv->mode = mode; |
431 | |
432 iv->base = simplify_gen_binary (PLUS, iv->extend_mode, iv->delta, | |
433 simplify_gen_binary (MULT, iv->extend_mode, | |
434 iv->base, iv->mult)); | |
435 iv->step = simplify_gen_binary (MULT, iv->extend_mode, iv->step, iv->mult); | |
436 iv->mult = const1_rtx; | |
437 iv->delta = const0_rtx; | |
438 iv->first_special = false; | |
439 | |
440 return true; | |
441 } | |
442 | |
443 /* Evaluates application of EXTEND to MODE on IV. */ | |
444 | |
445 static bool | |
111 | 446 iv_extend (struct rtx_iv *iv, enum iv_extend_code extend, scalar_int_mode mode) |
0 | 447 { |
448 /* If iv is invariant, just calculate the new value. */ | |
449 if (iv->step == const0_rtx | |
450 && !iv->first_special) | |
451 { | |
452 rtx val = get_iv_value (iv, const0_rtx); | |
111 | 453 if (iv->extend_mode != iv->mode |
454 && iv->extend != IV_UNKNOWN_EXTEND | |
455 && iv->extend != extend) | |
456 val = lowpart_subreg (iv->mode, val, iv->extend_mode); | |
457 val = simplify_gen_unary (iv_extend_to_rtx_code (extend), mode, | |
458 val, | |
459 iv->extend == extend | |
460 ? iv->extend_mode : iv->mode); | |
0 | 461 iv->base = val; |
111 | 462 iv->extend = IV_UNKNOWN_EXTEND; |
0 | 463 iv->mode = iv->extend_mode = mode; |
464 iv->delta = const0_rtx; | |
465 iv->mult = const1_rtx; | |
466 return true; | |
467 } | |
468 | |
469 if (mode != iv->extend_mode) | |
470 return false; | |
471 | |
111 | 472 if (iv->extend != IV_UNKNOWN_EXTEND |
0 | 473 && iv->extend != extend) |
474 return false; | |
475 | |
476 iv->extend = extend; | |
477 | |
478 return true; | |
479 } | |
480 | |
481 /* Evaluates negation of IV. */ | |
482 | |
483 static bool | |
484 iv_neg (struct rtx_iv *iv) | |
485 { | |
111 | 486 if (iv->extend == IV_UNKNOWN_EXTEND) |
0 | 487 { |
488 iv->base = simplify_gen_unary (NEG, iv->extend_mode, | |
489 iv->base, iv->extend_mode); | |
490 iv->step = simplify_gen_unary (NEG, iv->extend_mode, | |
491 iv->step, iv->extend_mode); | |
492 } | |
493 else | |
494 { | |
495 iv->delta = simplify_gen_unary (NEG, iv->extend_mode, | |
496 iv->delta, iv->extend_mode); | |
497 iv->mult = simplify_gen_unary (NEG, iv->extend_mode, | |
498 iv->mult, iv->extend_mode); | |
499 } | |
500 | |
501 return true; | |
502 } | |
503 | |
504 /* Evaluates addition or subtraction (according to OP) of IV1 to IV0. */ | |
505 | |
506 static bool | |
507 iv_add (struct rtx_iv *iv0, struct rtx_iv *iv1, enum rtx_code op) | |
508 { | |
111 | 509 scalar_int_mode mode; |
0 | 510 rtx arg; |
511 | |
512 /* Extend the constant to extend_mode of the other operand if necessary. */ | |
111 | 513 if (iv0->extend == IV_UNKNOWN_EXTEND |
0 | 514 && iv0->mode == iv0->extend_mode |
515 && iv0->step == const0_rtx | |
516 && GET_MODE_SIZE (iv0->extend_mode) < GET_MODE_SIZE (iv1->extend_mode)) | |
517 { | |
518 iv0->extend_mode = iv1->extend_mode; | |
519 iv0->base = simplify_gen_unary (ZERO_EXTEND, iv0->extend_mode, | |
520 iv0->base, iv0->mode); | |
521 } | |
111 | 522 if (iv1->extend == IV_UNKNOWN_EXTEND |
0 | 523 && iv1->mode == iv1->extend_mode |
524 && iv1->step == const0_rtx | |
525 && GET_MODE_SIZE (iv1->extend_mode) < GET_MODE_SIZE (iv0->extend_mode)) | |
526 { | |
527 iv1->extend_mode = iv0->extend_mode; | |
528 iv1->base = simplify_gen_unary (ZERO_EXTEND, iv1->extend_mode, | |
529 iv1->base, iv1->mode); | |
530 } | |
531 | |
532 mode = iv0->extend_mode; | |
533 if (mode != iv1->extend_mode) | |
534 return false; | |
535 | |
111 | 536 if (iv0->extend == IV_UNKNOWN_EXTEND |
537 && iv1->extend == IV_UNKNOWN_EXTEND) | |
0 | 538 { |
539 if (iv0->mode != iv1->mode) | |
540 return false; | |
541 | |
542 iv0->base = simplify_gen_binary (op, mode, iv0->base, iv1->base); | |
543 iv0->step = simplify_gen_binary (op, mode, iv0->step, iv1->step); | |
544 | |
545 return true; | |
546 } | |
547 | |
548 /* Handle addition of constant. */ | |
111 | 549 if (iv1->extend == IV_UNKNOWN_EXTEND |
0 | 550 && iv1->mode == mode |
551 && iv1->step == const0_rtx) | |
552 { | |
553 iv0->delta = simplify_gen_binary (op, mode, iv0->delta, iv1->base); | |
554 return true; | |
555 } | |
556 | |
111 | 557 if (iv0->extend == IV_UNKNOWN_EXTEND |
0 | 558 && iv0->mode == mode |
559 && iv0->step == const0_rtx) | |
560 { | |
561 arg = iv0->base; | |
562 *iv0 = *iv1; | |
563 if (op == MINUS | |
564 && !iv_neg (iv0)) | |
565 return false; | |
566 | |
567 iv0->delta = simplify_gen_binary (PLUS, mode, iv0->delta, arg); | |
568 return true; | |
569 } | |
570 | |
571 return false; | |
572 } | |
573 | |
574 /* Evaluates multiplication of IV by constant CST. */ | |
575 | |
576 static bool | |
577 iv_mult (struct rtx_iv *iv, rtx mby) | |
578 { | |
111 | 579 scalar_int_mode mode = iv->extend_mode; |
0 | 580 |
581 if (GET_MODE (mby) != VOIDmode | |
582 && GET_MODE (mby) != mode) | |
583 return false; | |
584 | |
111 | 585 if (iv->extend == IV_UNKNOWN_EXTEND) |
0 | 586 { |
587 iv->base = simplify_gen_binary (MULT, mode, iv->base, mby); | |
588 iv->step = simplify_gen_binary (MULT, mode, iv->step, mby); | |
589 } | |
590 else | |
591 { | |
592 iv->delta = simplify_gen_binary (MULT, mode, iv->delta, mby); | |
593 iv->mult = simplify_gen_binary (MULT, mode, iv->mult, mby); | |
594 } | |
595 | |
596 return true; | |
597 } | |
598 | |
599 /* Evaluates shift of IV by constant CST. */ | |
600 | |
601 static bool | |
602 iv_shift (struct rtx_iv *iv, rtx mby) | |
603 { | |
111 | 604 scalar_int_mode mode = iv->extend_mode; |
0 | 605 |
606 if (GET_MODE (mby) != VOIDmode | |
607 && GET_MODE (mby) != mode) | |
608 return false; | |
609 | |
111 | 610 if (iv->extend == IV_UNKNOWN_EXTEND) |
0 | 611 { |
612 iv->base = simplify_gen_binary (ASHIFT, mode, iv->base, mby); | |
613 iv->step = simplify_gen_binary (ASHIFT, mode, iv->step, mby); | |
614 } | |
615 else | |
616 { | |
617 iv->delta = simplify_gen_binary (ASHIFT, mode, iv->delta, mby); | |
618 iv->mult = simplify_gen_binary (ASHIFT, mode, iv->mult, mby); | |
619 } | |
620 | |
621 return true; | |
622 } | |
623 | |
624 /* The recursive part of get_biv_step. Gets the value of the single value | |
625 defined by DEF wrto initial value of REG inside loop, in shape described | |
626 at get_biv_step. */ | |
627 | |
628 static bool | |
111 | 629 get_biv_step_1 (df_ref def, scalar_int_mode outer_mode, rtx reg, |
630 rtx *inner_step, scalar_int_mode *inner_mode, | |
631 enum iv_extend_code *extend, | |
0 | 632 rtx *outer_step) |
633 { | |
634 rtx set, rhs, op0 = NULL_RTX, op1 = NULL_RTX; | |
111 | 635 rtx next, nextr; |
0 | 636 enum rtx_code code; |
111 | 637 rtx_insn *insn = DF_REF_INSN (def); |
0 | 638 df_ref next_def; |
639 enum iv_grd_result res; | |
640 | |
641 set = single_set (insn); | |
642 if (!set) | |
643 return false; | |
644 | |
645 rhs = find_reg_equal_equiv_note (insn); | |
646 if (rhs) | |
647 rhs = XEXP (rhs, 0); | |
648 else | |
649 rhs = SET_SRC (set); | |
650 | |
651 code = GET_CODE (rhs); | |
652 switch (code) | |
653 { | |
654 case SUBREG: | |
655 case REG: | |
656 next = rhs; | |
657 break; | |
658 | |
659 case PLUS: | |
660 case MINUS: | |
661 op0 = XEXP (rhs, 0); | |
662 op1 = XEXP (rhs, 1); | |
663 | |
664 if (code == PLUS && CONSTANT_P (op0)) | |
111 | 665 std::swap (op0, op1); |
0 | 666 |
667 if (!simple_reg_p (op0) | |
668 || !CONSTANT_P (op1)) | |
669 return false; | |
670 | |
671 if (GET_MODE (rhs) != outer_mode) | |
672 { | |
673 /* ppc64 uses expressions like | |
674 | |
675 (set x:SI (plus:SI (subreg:SI y:DI) 1)). | |
676 | |
677 this is equivalent to | |
678 | |
679 (set x':DI (plus:DI y:DI 1)) | |
680 (set x:SI (subreg:SI (x':DI)). */ | |
681 if (GET_CODE (op0) != SUBREG) | |
682 return false; | |
683 if (GET_MODE (SUBREG_REG (op0)) != outer_mode) | |
684 return false; | |
685 } | |
686 | |
687 next = op0; | |
688 break; | |
689 | |
690 case SIGN_EXTEND: | |
691 case ZERO_EXTEND: | |
692 if (GET_MODE (rhs) != outer_mode) | |
693 return false; | |
694 | |
695 op0 = XEXP (rhs, 0); | |
696 if (!simple_reg_p (op0)) | |
697 return false; | |
698 | |
699 next = op0; | |
700 break; | |
701 | |
702 default: | |
703 return false; | |
704 } | |
705 | |
706 if (GET_CODE (next) == SUBREG) | |
707 { | |
708 if (!subreg_lowpart_p (next)) | |
709 return false; | |
710 | |
711 nextr = SUBREG_REG (next); | |
712 if (GET_MODE (nextr) != outer_mode) | |
713 return false; | |
714 } | |
715 else | |
716 nextr = next; | |
717 | |
718 res = iv_get_reaching_def (insn, nextr, &next_def); | |
719 | |
720 if (res == GRD_INVALID || res == GRD_INVARIANT) | |
721 return false; | |
722 | |
723 if (res == GRD_MAYBE_BIV) | |
724 { | |
725 if (!rtx_equal_p (nextr, reg)) | |
726 return false; | |
727 | |
728 *inner_step = const0_rtx; | |
111 | 729 *extend = IV_UNKNOWN_EXTEND; |
0 | 730 *inner_mode = outer_mode; |
731 *outer_step = const0_rtx; | |
732 } | |
111 | 733 else if (!get_biv_step_1 (next_def, outer_mode, reg, |
734 inner_step, inner_mode, extend, | |
0 | 735 outer_step)) |
736 return false; | |
737 | |
738 if (GET_CODE (next) == SUBREG) | |
739 { | |
111 | 740 scalar_int_mode amode; |
741 if (!is_a <scalar_int_mode> (GET_MODE (next), &amode) | |
742 || GET_MODE_SIZE (amode) > GET_MODE_SIZE (*inner_mode)) | |
0 | 743 return false; |
744 | |
745 *inner_mode = amode; | |
746 *inner_step = simplify_gen_binary (PLUS, outer_mode, | |
747 *inner_step, *outer_step); | |
748 *outer_step = const0_rtx; | |
111 | 749 *extend = IV_UNKNOWN_EXTEND; |
0 | 750 } |
751 | |
752 switch (code) | |
753 { | |
754 case REG: | |
755 case SUBREG: | |
756 break; | |
757 | |
758 case PLUS: | |
759 case MINUS: | |
760 if (*inner_mode == outer_mode | |
761 /* See comment in previous switch. */ | |
762 || GET_MODE (rhs) != outer_mode) | |
763 *inner_step = simplify_gen_binary (code, outer_mode, | |
764 *inner_step, op1); | |
765 else | |
766 *outer_step = simplify_gen_binary (code, outer_mode, | |
767 *outer_step, op1); | |
768 break; | |
769 | |
770 case SIGN_EXTEND: | |
771 case ZERO_EXTEND: | |
772 gcc_assert (GET_MODE (op0) == *inner_mode | |
111 | 773 && *extend == IV_UNKNOWN_EXTEND |
0 | 774 && *outer_step == const0_rtx); |
775 | |
111 | 776 *extend = (code == SIGN_EXTEND) ? IV_SIGN_EXTEND : IV_ZERO_EXTEND; |
0 | 777 break; |
778 | |
779 default: | |
780 return false; | |
781 } | |
782 | |
783 return true; | |
784 } | |
785 | |
786 /* Gets the operation on register REG inside loop, in shape | |
787 | |
788 OUTER_STEP + EXTEND_{OUTER_MODE} (SUBREG_{INNER_MODE} (REG + INNER_STEP)) | |
789 | |
790 If the operation cannot be described in this shape, return false. | |
791 LAST_DEF is the definition of REG that dominates loop latch. */ | |
792 | |
793 static bool | |
111 | 794 get_biv_step (df_ref last_def, scalar_int_mode outer_mode, rtx reg, |
795 rtx *inner_step, scalar_int_mode *inner_mode, | |
796 enum iv_extend_code *extend, rtx *outer_step) | |
0 | 797 { |
111 | 798 if (!get_biv_step_1 (last_def, outer_mode, reg, |
799 inner_step, inner_mode, extend, | |
0 | 800 outer_step)) |
801 return false; | |
802 | |
111 | 803 gcc_assert ((*inner_mode == outer_mode) != (*extend != IV_UNKNOWN_EXTEND)); |
804 gcc_assert (*inner_mode != outer_mode || *outer_step == const0_rtx); | |
0 | 805 |
806 return true; | |
807 } | |
808 | |
809 /* Records information that DEF is induction variable IV. */ | |
810 | |
811 static void | |
812 record_iv (df_ref def, struct rtx_iv *iv) | |
813 { | |
814 struct rtx_iv *recorded_iv = XNEW (struct rtx_iv); | |
815 | |
816 *recorded_iv = *iv; | |
817 check_iv_ref_table_size (); | |
818 DF_REF_IV_SET (def, recorded_iv); | |
819 } | |
820 | |
821 /* If DEF was already analyzed for bivness, store the description of the biv to | |
822 IV and return true. Otherwise return false. */ | |
823 | |
824 static bool | |
825 analyzed_for_bivness_p (rtx def, struct rtx_iv *iv) | |
826 { | |
111 | 827 struct biv_entry *biv = bivs->find_with_hash (def, REGNO (def)); |
0 | 828 |
829 if (!biv) | |
830 return false; | |
831 | |
832 *iv = biv->iv; | |
833 return true; | |
834 } | |
835 | |
836 static void | |
837 record_biv (rtx def, struct rtx_iv *iv) | |
838 { | |
839 struct biv_entry *biv = XNEW (struct biv_entry); | |
111 | 840 biv_entry **slot = bivs->find_slot_with_hash (def, REGNO (def), INSERT); |
0 | 841 |
842 biv->regno = REGNO (def); | |
843 biv->iv = *iv; | |
844 gcc_assert (!*slot); | |
845 *slot = biv; | |
846 } | |
847 | |
848 /* Determines whether DEF is a biv and if so, stores its description | |
111 | 849 to *IV. OUTER_MODE is the mode of DEF. */ |
0 | 850 |
851 static bool | |
111 | 852 iv_analyze_biv (scalar_int_mode outer_mode, rtx def, struct rtx_iv *iv) |
0 | 853 { |
854 rtx inner_step, outer_step; | |
111 | 855 scalar_int_mode inner_mode; |
856 enum iv_extend_code extend; | |
0 | 857 df_ref last_def; |
858 | |
859 if (dump_file) | |
860 { | |
861 fprintf (dump_file, "Analyzing "); | |
862 print_rtl (dump_file, def); | |
863 fprintf (dump_file, " for bivness.\n"); | |
864 } | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
865 |
0 | 866 if (!REG_P (def)) |
867 { | |
868 if (!CONSTANT_P (def)) | |
869 return false; | |
870 | |
111 | 871 return iv_constant (iv, outer_mode, def); |
0 | 872 } |
873 | |
874 if (!latch_dominating_def (def, &last_def)) | |
875 { | |
876 if (dump_file) | |
877 fprintf (dump_file, " not simple.\n"); | |
878 return false; | |
879 } | |
880 | |
881 if (!last_def) | |
111 | 882 return iv_constant (iv, outer_mode, def); |
0 | 883 |
884 if (analyzed_for_bivness_p (def, iv)) | |
885 { | |
886 if (dump_file) | |
887 fprintf (dump_file, " already analysed.\n"); | |
888 return iv->base != NULL_RTX; | |
889 } | |
890 | |
111 | 891 if (!get_biv_step (last_def, outer_mode, def, &inner_step, &inner_mode, |
892 &extend, &outer_step)) | |
0 | 893 { |
894 iv->base = NULL_RTX; | |
895 goto end; | |
896 } | |
897 | |
898 /* Loop transforms base to es (base + inner_step) + outer_step, | |
899 where es means extend of subreg between inner_mode and outer_mode. | |
900 The corresponding induction variable is | |
901 | |
902 es ((base - outer_step) + i * (inner_step + outer_step)) + outer_step */ | |
903 | |
904 iv->base = simplify_gen_binary (MINUS, outer_mode, def, outer_step); | |
905 iv->step = simplify_gen_binary (PLUS, outer_mode, inner_step, outer_step); | |
906 iv->mode = inner_mode; | |
907 iv->extend_mode = outer_mode; | |
908 iv->extend = extend; | |
909 iv->mult = const1_rtx; | |
910 iv->delta = outer_step; | |
911 iv->first_special = inner_mode != outer_mode; | |
912 | |
913 end: | |
914 if (dump_file) | |
915 { | |
916 fprintf (dump_file, " "); | |
917 dump_iv_info (dump_file, iv); | |
918 fprintf (dump_file, "\n"); | |
919 } | |
920 | |
921 record_biv (def, iv); | |
922 return iv->base != NULL_RTX; | |
923 } | |
924 | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
925 /* Analyzes expression RHS used at INSN and stores the result to *IV. |
0 | 926 The mode of the induction variable is MODE. */ |
927 | |
928 bool | |
111 | 929 iv_analyze_expr (rtx_insn *insn, scalar_int_mode mode, rtx rhs, |
930 struct rtx_iv *iv) | |
0 | 931 { |
111 | 932 rtx mby = NULL_RTX; |
0 | 933 rtx op0 = NULL_RTX, op1 = NULL_RTX; |
934 struct rtx_iv iv0, iv1; | |
935 enum rtx_code code = GET_CODE (rhs); | |
111 | 936 scalar_int_mode omode = mode; |
937 | |
0 | 938 iv->base = NULL_RTX; |
939 iv->step = NULL_RTX; | |
940 | |
941 gcc_assert (GET_MODE (rhs) == mode || GET_MODE (rhs) == VOIDmode); | |
942 | |
943 if (CONSTANT_P (rhs) | |
944 || REG_P (rhs) | |
945 || code == SUBREG) | |
111 | 946 return iv_analyze_op (insn, mode, rhs, iv); |
0 | 947 |
948 switch (code) | |
949 { | |
950 case REG: | |
951 op0 = rhs; | |
952 break; | |
953 | |
954 case SIGN_EXTEND: | |
955 case ZERO_EXTEND: | |
956 case NEG: | |
957 op0 = XEXP (rhs, 0); | |
111 | 958 /* We don't know how many bits there are in a sign-extended constant. */ |
959 if (!is_a <scalar_int_mode> (GET_MODE (op0), &omode)) | |
960 return false; | |
0 | 961 break; |
962 | |
963 case PLUS: | |
964 case MINUS: | |
965 op0 = XEXP (rhs, 0); | |
966 op1 = XEXP (rhs, 1); | |
967 break; | |
968 | |
969 case MULT: | |
970 op0 = XEXP (rhs, 0); | |
971 mby = XEXP (rhs, 1); | |
972 if (!CONSTANT_P (mby)) | |
111 | 973 std::swap (op0, mby); |
0 | 974 if (!CONSTANT_P (mby)) |
975 return false; | |
976 break; | |
977 | |
978 case ASHIFT: | |
979 op0 = XEXP (rhs, 0); | |
980 mby = XEXP (rhs, 1); | |
981 if (!CONSTANT_P (mby)) | |
982 return false; | |
983 break; | |
984 | |
985 default: | |
986 return false; | |
987 } | |
988 | |
989 if (op0 | |
111 | 990 && !iv_analyze_expr (insn, omode, op0, &iv0)) |
0 | 991 return false; |
992 | |
993 if (op1 | |
111 | 994 && !iv_analyze_expr (insn, omode, op1, &iv1)) |
0 | 995 return false; |
996 | |
997 switch (code) | |
998 { | |
999 case SIGN_EXTEND: | |
111 | 1000 if (!iv_extend (&iv0, IV_SIGN_EXTEND, mode)) |
1001 return false; | |
1002 break; | |
1003 | |
0 | 1004 case ZERO_EXTEND: |
111 | 1005 if (!iv_extend (&iv0, IV_ZERO_EXTEND, mode)) |
0 | 1006 return false; |
1007 break; | |
1008 | |
1009 case NEG: | |
1010 if (!iv_neg (&iv0)) | |
1011 return false; | |
1012 break; | |
1013 | |
1014 case PLUS: | |
1015 case MINUS: | |
1016 if (!iv_add (&iv0, &iv1, code)) | |
1017 return false; | |
1018 break; | |
1019 | |
1020 case MULT: | |
1021 if (!iv_mult (&iv0, mby)) | |
1022 return false; | |
1023 break; | |
1024 | |
1025 case ASHIFT: | |
1026 if (!iv_shift (&iv0, mby)) | |
1027 return false; | |
1028 break; | |
1029 | |
1030 default: | |
1031 break; | |
1032 } | |
1033 | |
1034 *iv = iv0; | |
1035 return iv->base != NULL_RTX; | |
1036 } | |
1037 | |
1038 /* Analyzes iv DEF and stores the result to *IV. */ | |
1039 | |
1040 static bool | |
1041 iv_analyze_def (df_ref def, struct rtx_iv *iv) | |
1042 { | |
111 | 1043 rtx_insn *insn = DF_REF_INSN (def); |
0 | 1044 rtx reg = DF_REF_REG (def); |
1045 rtx set, rhs; | |
1046 | |
1047 if (dump_file) | |
1048 { | |
1049 fprintf (dump_file, "Analyzing def of "); | |
1050 print_rtl (dump_file, reg); | |
1051 fprintf (dump_file, " in insn "); | |
1052 print_rtl_single (dump_file, insn); | |
1053 } | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1054 |
0 | 1055 check_iv_ref_table_size (); |
1056 if (DF_REF_IV (def)) | |
1057 { | |
1058 if (dump_file) | |
1059 fprintf (dump_file, " already analysed.\n"); | |
1060 *iv = *DF_REF_IV (def); | |
1061 return iv->base != NULL_RTX; | |
1062 } | |
1063 | |
1064 iv->base = NULL_RTX; | |
1065 iv->step = NULL_RTX; | |
1066 | |
111 | 1067 scalar_int_mode mode; |
1068 if (!REG_P (reg) || !is_a <scalar_int_mode> (GET_MODE (reg), &mode)) | |
0 | 1069 return false; |
1070 | |
1071 set = single_set (insn); | |
1072 if (!set) | |
1073 return false; | |
1074 | |
1075 if (!REG_P (SET_DEST (set))) | |
1076 return false; | |
1077 | |
1078 gcc_assert (SET_DEST (set) == reg); | |
1079 rhs = find_reg_equal_equiv_note (insn); | |
1080 if (rhs) | |
1081 rhs = XEXP (rhs, 0); | |
1082 else | |
1083 rhs = SET_SRC (set); | |
1084 | |
111 | 1085 iv_analyze_expr (insn, mode, rhs, iv); |
0 | 1086 record_iv (def, iv); |
1087 | |
1088 if (dump_file) | |
1089 { | |
1090 print_rtl (dump_file, reg); | |
1091 fprintf (dump_file, " in insn "); | |
1092 print_rtl_single (dump_file, insn); | |
1093 fprintf (dump_file, " is "); | |
1094 dump_iv_info (dump_file, iv); | |
1095 fprintf (dump_file, "\n"); | |
1096 } | |
1097 | |
1098 return iv->base != NULL_RTX; | |
1099 } | |
1100 | |
111 | 1101 /* Analyzes operand OP of INSN and stores the result to *IV. MODE is the |
1102 mode of OP. */ | |
0 | 1103 |
1104 static bool | |
111 | 1105 iv_analyze_op (rtx_insn *insn, scalar_int_mode mode, rtx op, struct rtx_iv *iv) |
0 | 1106 { |
1107 df_ref def = NULL; | |
1108 enum iv_grd_result res; | |
1109 | |
1110 if (dump_file) | |
1111 { | |
1112 fprintf (dump_file, "Analyzing operand "); | |
1113 print_rtl (dump_file, op); | |
1114 fprintf (dump_file, " of insn "); | |
1115 print_rtl_single (dump_file, insn); | |
1116 } | |
1117 | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1118 if (function_invariant_p (op)) |
0 | 1119 res = GRD_INVARIANT; |
1120 else if (GET_CODE (op) == SUBREG) | |
1121 { | |
111 | 1122 scalar_int_mode inner_mode; |
1123 if (!subreg_lowpart_p (op) | |
1124 || !is_a <scalar_int_mode> (GET_MODE (SUBREG_REG (op)), &inner_mode)) | |
0 | 1125 return false; |
1126 | |
111 | 1127 if (!iv_analyze_op (insn, inner_mode, SUBREG_REG (op), iv)) |
0 | 1128 return false; |
1129 | |
111 | 1130 return iv_subreg (iv, mode); |
0 | 1131 } |
1132 else | |
1133 { | |
1134 res = iv_get_reaching_def (insn, op, &def); | |
1135 if (res == GRD_INVALID) | |
1136 { | |
1137 if (dump_file) | |
1138 fprintf (dump_file, " not simple.\n"); | |
1139 return false; | |
1140 } | |
1141 } | |
1142 | |
1143 if (res == GRD_INVARIANT) | |
1144 { | |
111 | 1145 iv_constant (iv, mode, op); |
0 | 1146 |
1147 if (dump_file) | |
1148 { | |
1149 fprintf (dump_file, " "); | |
1150 dump_iv_info (dump_file, iv); | |
1151 fprintf (dump_file, "\n"); | |
1152 } | |
1153 return true; | |
1154 } | |
1155 | |
1156 if (res == GRD_MAYBE_BIV) | |
111 | 1157 return iv_analyze_biv (mode, op, iv); |
0 | 1158 |
1159 return iv_analyze_def (def, iv); | |
1160 } | |
1161 | |
111 | 1162 /* Analyzes value VAL at INSN and stores the result to *IV. MODE is the |
1163 mode of VAL. */ | |
0 | 1164 |
1165 bool | |
111 | 1166 iv_analyze (rtx_insn *insn, scalar_int_mode mode, rtx val, struct rtx_iv *iv) |
0 | 1167 { |
1168 rtx reg; | |
1169 | |
1170 /* We must find the insn in that val is used, so that we get to UD chains. | |
1171 Since the function is sometimes called on result of get_condition, | |
1172 this does not necessarily have to be directly INSN; scan also the | |
1173 following insns. */ | |
1174 if (simple_reg_p (val)) | |
1175 { | |
1176 if (GET_CODE (val) == SUBREG) | |
1177 reg = SUBREG_REG (val); | |
1178 else | |
1179 reg = val; | |
1180 | |
1181 while (!df_find_use (insn, reg)) | |
1182 insn = NEXT_INSN (insn); | |
1183 } | |
1184 | |
111 | 1185 return iv_analyze_op (insn, mode, val, iv); |
0 | 1186 } |
1187 | |
1188 /* Analyzes definition of DEF in INSN and stores the result to IV. */ | |
1189 | |
1190 bool | |
111 | 1191 iv_analyze_result (rtx_insn *insn, rtx def, struct rtx_iv *iv) |
0 | 1192 { |
1193 df_ref adef; | |
1194 | |
1195 adef = df_find_def (insn, def); | |
1196 if (!adef) | |
1197 return false; | |
1198 | |
1199 return iv_analyze_def (adef, iv); | |
1200 } | |
1201 | |
1202 /* Checks whether definition of register REG in INSN is a basic induction | |
111 | 1203 variable. MODE is the mode of REG. |
1204 | |
1205 IV analysis must have been initialized (via a call to | |
0 | 1206 iv_analysis_loop_init) for this function to produce a result. */ |
1207 | |
1208 bool | |
111 | 1209 biv_p (rtx_insn *insn, scalar_int_mode mode, rtx reg) |
0 | 1210 { |
1211 struct rtx_iv iv; | |
1212 df_ref def, last_def; | |
1213 | |
1214 if (!simple_reg_p (reg)) | |
1215 return false; | |
1216 | |
1217 def = df_find_def (insn, reg); | |
1218 gcc_assert (def != NULL); | |
1219 if (!latch_dominating_def (reg, &last_def)) | |
1220 return false; | |
1221 if (last_def != def) | |
1222 return false; | |
1223 | |
111 | 1224 if (!iv_analyze_biv (mode, reg, &iv)) |
0 | 1225 return false; |
1226 | |
1227 return iv.step != const0_rtx; | |
1228 } | |
1229 | |
1230 /* Calculates value of IV at ITERATION-th iteration. */ | |
1231 | |
1232 rtx | |
1233 get_iv_value (struct rtx_iv *iv, rtx iteration) | |
1234 { | |
1235 rtx val; | |
1236 | |
1237 /* We would need to generate some if_then_else patterns, and so far | |
1238 it is not needed anywhere. */ | |
1239 gcc_assert (!iv->first_special); | |
1240 | |
1241 if (iv->step != const0_rtx && iteration != const0_rtx) | |
1242 val = simplify_gen_binary (PLUS, iv->extend_mode, iv->base, | |
1243 simplify_gen_binary (MULT, iv->extend_mode, | |
1244 iv->step, iteration)); | |
1245 else | |
1246 val = iv->base; | |
1247 | |
1248 if (iv->extend_mode == iv->mode) | |
1249 return val; | |
1250 | |
1251 val = lowpart_subreg (iv->mode, val, iv->extend_mode); | |
1252 | |
111 | 1253 if (iv->extend == IV_UNKNOWN_EXTEND) |
0 | 1254 return val; |
1255 | |
111 | 1256 val = simplify_gen_unary (iv_extend_to_rtx_code (iv->extend), |
1257 iv->extend_mode, val, iv->mode); | |
0 | 1258 val = simplify_gen_binary (PLUS, iv->extend_mode, iv->delta, |
1259 simplify_gen_binary (MULT, iv->extend_mode, | |
1260 iv->mult, val)); | |
1261 | |
1262 return val; | |
1263 } | |
1264 | |
1265 /* Free the data for an induction variable analysis. */ | |
1266 | |
1267 void | |
1268 iv_analysis_done (void) | |
1269 { | |
1270 if (!clean_slate) | |
1271 { | |
1272 clear_iv_info (); | |
1273 clean_slate = true; | |
1274 df_finish_pass (true); | |
111 | 1275 delete bivs; |
1276 bivs = NULL; | |
0 | 1277 free (iv_ref_table); |
1278 iv_ref_table = NULL; | |
1279 iv_ref_table_size = 0; | |
1280 } | |
1281 } | |
1282 | |
1283 /* Computes inverse to X modulo (1 << MOD). */ | |
1284 | |
111 | 1285 static uint64_t |
1286 inverse (uint64_t x, int mod) | |
0 | 1287 { |
111 | 1288 uint64_t mask = |
1289 ((uint64_t) 1 << (mod - 1) << 1) - 1; | |
1290 uint64_t rslt = 1; | |
0 | 1291 int i; |
1292 | |
1293 for (i = 0; i < mod - 1; i++) | |
1294 { | |
1295 rslt = (rslt * x) & mask; | |
1296 x = (x * x) & mask; | |
1297 } | |
1298 | |
1299 return rslt; | |
1300 } | |
1301 | |
111 | 1302 /* Checks whether any register in X is in set ALT. */ |
1303 | |
1304 static bool | |
1305 altered_reg_used (const_rtx x, bitmap alt) | |
0 | 1306 { |
111 | 1307 subrtx_iterator::array_type array; |
1308 FOR_EACH_SUBRTX (iter, array, x, NONCONST) | |
1309 { | |
1310 const_rtx x = *iter; | |
1311 if (REG_P (x) && REGNO_REG_SET_P (alt, REGNO (x))) | |
1312 return true; | |
1313 } | |
1314 return false; | |
0 | 1315 } |
1316 | |
1317 /* Marks registers altered by EXPR in set ALT. */ | |
1318 | |
1319 static void | |
1320 mark_altered (rtx expr, const_rtx by ATTRIBUTE_UNUSED, void *alt) | |
1321 { | |
1322 if (GET_CODE (expr) == SUBREG) | |
1323 expr = SUBREG_REG (expr); | |
1324 if (!REG_P (expr)) | |
1325 return; | |
1326 | |
1327 SET_REGNO_REG_SET ((bitmap) alt, REGNO (expr)); | |
1328 } | |
1329 | |
1330 /* Checks whether RHS is simple enough to process. */ | |
1331 | |
1332 static bool | |
1333 simple_rhs_p (rtx rhs) | |
1334 { | |
1335 rtx op0, op1; | |
1336 | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1337 if (function_invariant_p (rhs) |
0 | 1338 || (REG_P (rhs) && !HARD_REGISTER_P (rhs))) |
1339 return true; | |
1340 | |
1341 switch (GET_CODE (rhs)) | |
1342 { | |
1343 case PLUS: | |
1344 case MINUS: | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1345 case AND: |
0 | 1346 op0 = XEXP (rhs, 0); |
1347 op1 = XEXP (rhs, 1); | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1348 /* Allow reg OP const and reg OP reg. */ |
0 | 1349 if (!(REG_P (op0) && !HARD_REGISTER_P (op0)) |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1350 && !function_invariant_p (op0)) |
0 | 1351 return false; |
1352 if (!(REG_P (op1) && !HARD_REGISTER_P (op1)) | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1353 && !function_invariant_p (op1)) |
0 | 1354 return false; |
1355 | |
1356 return true; | |
1357 | |
1358 case ASHIFT: | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1359 case ASHIFTRT: |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1360 case LSHIFTRT: |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1361 case MULT: |
0 | 1362 op0 = XEXP (rhs, 0); |
1363 op1 = XEXP (rhs, 1); | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1364 /* Allow reg OP const. */ |
0 | 1365 if (!(REG_P (op0) && !HARD_REGISTER_P (op0))) |
1366 return false; | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1367 if (!function_invariant_p (op1)) |
0 | 1368 return false; |
1369 | |
1370 return true; | |
1371 | |
1372 default: | |
1373 return false; | |
1374 } | |
1375 } | |
1376 | |
111 | 1377 /* If REGNO has a single definition, return its known value, otherwise return |
1378 null. */ | |
1379 | |
1380 static rtx | |
1381 find_single_def_src (unsigned int regno) | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1382 { |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1383 df_ref adef; |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1384 rtx set, src; |
111 | 1385 |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1386 for (;;) |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1387 { |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1388 rtx note; |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1389 adef = DF_REG_DEF_CHAIN (regno); |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1390 if (adef == NULL || DF_REF_NEXT_REG (adef) != NULL |
111 | 1391 || DF_REF_IS_ARTIFICIAL (adef)) |
1392 return NULL_RTX; | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1393 |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1394 set = single_set (DF_REF_INSN (adef)); |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1395 if (set == NULL || !REG_P (SET_DEST (set)) |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1396 || REGNO (SET_DEST (set)) != regno) |
111 | 1397 return NULL_RTX; |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1398 |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1399 note = find_reg_equal_equiv_note (DF_REF_INSN (adef)); |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1400 |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1401 if (note && function_invariant_p (XEXP (note, 0))) |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1402 { |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1403 src = XEXP (note, 0); |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1404 break; |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1405 } |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1406 src = SET_SRC (set); |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1407 |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1408 if (REG_P (src)) |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1409 { |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1410 regno = REGNO (src); |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1411 continue; |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1412 } |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1413 break; |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1414 } |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1415 if (!function_invariant_p (src)) |
111 | 1416 return NULL_RTX; |
1417 | |
1418 return src; | |
1419 } | |
1420 | |
1421 /* If any registers in *EXPR that have a single definition, try to replace | |
1422 them with the known-equivalent values. */ | |
1423 | |
1424 static void | |
1425 replace_single_def_regs (rtx *expr) | |
1426 { | |
1427 subrtx_var_iterator::array_type array; | |
1428 repeat: | |
1429 FOR_EACH_SUBRTX_VAR (iter, array, *expr, NONCONST) | |
1430 { | |
1431 rtx x = *iter; | |
1432 if (REG_P (x)) | |
1433 if (rtx new_x = find_single_def_src (REGNO (x))) | |
1434 { | |
1435 *expr = simplify_replace_rtx (*expr, x, new_x); | |
1436 goto repeat; | |
1437 } | |
1438 } | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1439 } |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1440 |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1441 /* A subroutine of simplify_using_initial_values, this function examines INSN |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1442 to see if it contains a suitable set that we can use to make a replacement. |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1443 If it is suitable, return true and set DEST and SRC to the lhs and rhs of |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1444 the set; return false otherwise. */ |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1445 |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1446 static bool |
111 | 1447 suitable_set_for_replacement (rtx_insn *insn, rtx *dest, rtx *src) |
0 | 1448 { |
1449 rtx set = single_set (insn); | |
1450 rtx lhs = NULL_RTX, rhs; | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1451 |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1452 if (!set) |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1453 return false; |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1454 |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1455 lhs = SET_DEST (set); |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1456 if (!REG_P (lhs)) |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1457 return false; |
0 | 1458 |
1459 rhs = find_reg_equal_equiv_note (insn); | |
1460 if (rhs) | |
1461 rhs = XEXP (rhs, 0); | |
1462 else | |
1463 rhs = SET_SRC (set); | |
1464 | |
1465 if (!simple_rhs_p (rhs)) | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1466 return false; |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1467 |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1468 *dest = lhs; |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1469 *src = rhs; |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1470 return true; |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1471 } |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1472 |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1473 /* Using the data returned by suitable_set_for_replacement, replace DEST |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1474 with SRC in *EXPR and return the new expression. Also call |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1475 replace_single_def_regs if the replacement changed something. */ |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1476 static void |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1477 replace_in_expr (rtx *expr, rtx dest, rtx src) |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1478 { |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1479 rtx old = *expr; |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1480 *expr = simplify_replace_rtx (*expr, dest, src); |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1481 if (old == *expr) |
0 | 1482 return; |
111 | 1483 replace_single_def_regs (expr); |
0 | 1484 } |
1485 | |
1486 /* Checks whether A implies B. */ | |
1487 | |
1488 static bool | |
1489 implies_p (rtx a, rtx b) | |
1490 { | |
111 | 1491 rtx op0, op1, opb0, opb1; |
1492 machine_mode mode; | |
1493 | |
1494 if (rtx_equal_p (a, b)) | |
1495 return true; | |
0 | 1496 |
1497 if (GET_CODE (a) == EQ) | |
1498 { | |
1499 op0 = XEXP (a, 0); | |
1500 op1 = XEXP (a, 1); | |
1501 | |
111 | 1502 if (REG_P (op0) |
1503 || (GET_CODE (op0) == SUBREG | |
1504 && REG_P (SUBREG_REG (op0)))) | |
0 | 1505 { |
111 | 1506 rtx r = simplify_replace_rtx (b, op0, op1); |
0 | 1507 if (r == const_true_rtx) |
1508 return true; | |
1509 } | |
1510 | |
111 | 1511 if (REG_P (op1) |
1512 || (GET_CODE (op1) == SUBREG | |
1513 && REG_P (SUBREG_REG (op1)))) | |
0 | 1514 { |
111 | 1515 rtx r = simplify_replace_rtx (b, op1, op0); |
0 | 1516 if (r == const_true_rtx) |
1517 return true; | |
1518 } | |
1519 } | |
1520 | |
1521 if (b == const_true_rtx) | |
1522 return true; | |
1523 | |
1524 if ((GET_RTX_CLASS (GET_CODE (a)) != RTX_COMM_COMPARE | |
1525 && GET_RTX_CLASS (GET_CODE (a)) != RTX_COMPARE) | |
1526 || (GET_RTX_CLASS (GET_CODE (b)) != RTX_COMM_COMPARE | |
1527 && GET_RTX_CLASS (GET_CODE (b)) != RTX_COMPARE)) | |
1528 return false; | |
1529 | |
1530 op0 = XEXP (a, 0); | |
1531 op1 = XEXP (a, 1); | |
1532 opb0 = XEXP (b, 0); | |
1533 opb1 = XEXP (b, 1); | |
1534 | |
1535 mode = GET_MODE (op0); | |
1536 if (mode != GET_MODE (opb0)) | |
1537 mode = VOIDmode; | |
1538 else if (mode == VOIDmode) | |
1539 { | |
1540 mode = GET_MODE (op1); | |
1541 if (mode != GET_MODE (opb1)) | |
1542 mode = VOIDmode; | |
1543 } | |
1544 | |
1545 /* A < B implies A + 1 <= B. */ | |
1546 if ((GET_CODE (a) == GT || GET_CODE (a) == LT) | |
1547 && (GET_CODE (b) == GE || GET_CODE (b) == LE)) | |
1548 { | |
1549 | |
1550 if (GET_CODE (a) == GT) | |
111 | 1551 std::swap (op0, op1); |
0 | 1552 |
1553 if (GET_CODE (b) == GE) | |
111 | 1554 std::swap (opb0, opb1); |
0 | 1555 |
1556 if (SCALAR_INT_MODE_P (mode) | |
1557 && rtx_equal_p (op1, opb1) | |
1558 && simplify_gen_binary (MINUS, mode, opb0, op0) == const1_rtx) | |
1559 return true; | |
1560 return false; | |
1561 } | |
1562 | |
1563 /* A < B or A > B imply A != B. TODO: Likewise | |
1564 A + n < B implies A != B + n if neither wraps. */ | |
1565 if (GET_CODE (b) == NE | |
1566 && (GET_CODE (a) == GT || GET_CODE (a) == GTU | |
1567 || GET_CODE (a) == LT || GET_CODE (a) == LTU)) | |
1568 { | |
1569 if (rtx_equal_p (op0, opb0) | |
1570 && rtx_equal_p (op1, opb1)) | |
1571 return true; | |
1572 } | |
1573 | |
1574 /* For unsigned comparisons, A != 0 implies A > 0 and A >= 1. */ | |
1575 if (GET_CODE (a) == NE | |
1576 && op1 == const0_rtx) | |
1577 { | |
1578 if ((GET_CODE (b) == GTU | |
1579 && opb1 == const0_rtx) | |
1580 || (GET_CODE (b) == GEU | |
1581 && opb1 == const1_rtx)) | |
1582 return rtx_equal_p (op0, opb0); | |
1583 } | |
1584 | |
1585 /* A != N is equivalent to A - (N + 1) <u -1. */ | |
1586 if (GET_CODE (a) == NE | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1587 && CONST_INT_P (op1) |
0 | 1588 && GET_CODE (b) == LTU |
1589 && opb1 == constm1_rtx | |
1590 && GET_CODE (opb0) == PLUS | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1591 && CONST_INT_P (XEXP (opb0, 1)) |
0 | 1592 /* Avoid overflows. */ |
1593 && ((unsigned HOST_WIDE_INT) INTVAL (XEXP (opb0, 1)) | |
1594 != ((unsigned HOST_WIDE_INT)1 | |
1595 << (HOST_BITS_PER_WIDE_INT - 1)) - 1) | |
1596 && INTVAL (XEXP (opb0, 1)) + 1 == -INTVAL (op1)) | |
1597 return rtx_equal_p (op0, XEXP (opb0, 0)); | |
1598 | |
1599 /* Likewise, A != N implies A - N > 0. */ | |
1600 if (GET_CODE (a) == NE | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1601 && CONST_INT_P (op1)) |
0 | 1602 { |
1603 if (GET_CODE (b) == GTU | |
1604 && GET_CODE (opb0) == PLUS | |
1605 && opb1 == const0_rtx | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1606 && CONST_INT_P (XEXP (opb0, 1)) |
0 | 1607 /* Avoid overflows. */ |
1608 && ((unsigned HOST_WIDE_INT) INTVAL (XEXP (opb0, 1)) | |
111 | 1609 != (HOST_WIDE_INT_1U << (HOST_BITS_PER_WIDE_INT - 1))) |
0 | 1610 && rtx_equal_p (XEXP (opb0, 0), op0)) |
1611 return INTVAL (op1) == -INTVAL (XEXP (opb0, 1)); | |
1612 if (GET_CODE (b) == GEU | |
1613 && GET_CODE (opb0) == PLUS | |
1614 && opb1 == const1_rtx | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1615 && CONST_INT_P (XEXP (opb0, 1)) |
0 | 1616 /* Avoid overflows. */ |
1617 && ((unsigned HOST_WIDE_INT) INTVAL (XEXP (opb0, 1)) | |
111 | 1618 != (HOST_WIDE_INT_1U << (HOST_BITS_PER_WIDE_INT - 1))) |
0 | 1619 && rtx_equal_p (XEXP (opb0, 0), op0)) |
1620 return INTVAL (op1) == -INTVAL (XEXP (opb0, 1)); | |
1621 } | |
1622 | |
1623 /* A >s X, where X is positive, implies A <u Y, if Y is negative. */ | |
1624 if ((GET_CODE (a) == GT || GET_CODE (a) == GE) | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1625 && CONST_INT_P (op1) |
0 | 1626 && ((GET_CODE (a) == GT && op1 == constm1_rtx) |
1627 || INTVAL (op1) >= 0) | |
1628 && GET_CODE (b) == LTU | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1629 && CONST_INT_P (opb1) |
0 | 1630 && rtx_equal_p (op0, opb0)) |
1631 return INTVAL (opb1) < 0; | |
1632 | |
1633 return false; | |
1634 } | |
1635 | |
1636 /* Canonicalizes COND so that | |
1637 | |
1638 (1) Ensure that operands are ordered according to | |
1639 swap_commutative_operands_p. | |
1640 (2) (LE x const) will be replaced with (LT x <const+1>) and similarly | |
1641 for GE, GEU, and LEU. */ | |
1642 | |
1643 rtx | |
1644 canon_condition (rtx cond) | |
1645 { | |
1646 rtx op0, op1; | |
1647 enum rtx_code code; | |
111 | 1648 machine_mode mode; |
0 | 1649 |
1650 code = GET_CODE (cond); | |
1651 op0 = XEXP (cond, 0); | |
1652 op1 = XEXP (cond, 1); | |
1653 | |
1654 if (swap_commutative_operands_p (op0, op1)) | |
1655 { | |
1656 code = swap_condition (code); | |
111 | 1657 std::swap (op0, op1); |
0 | 1658 } |
1659 | |
1660 mode = GET_MODE (op0); | |
1661 if (mode == VOIDmode) | |
1662 mode = GET_MODE (op1); | |
1663 gcc_assert (mode != VOIDmode); | |
1664 | |
111 | 1665 if (CONST_SCALAR_INT_P (op1) && GET_MODE_CLASS (mode) != MODE_CC) |
0 | 1666 { |
111 | 1667 rtx_mode_t const_val (op1, mode); |
0 | 1668 |
1669 switch (code) | |
1670 { | |
1671 case LE: | |
111 | 1672 if (wi::ne_p (const_val, wi::max_value (mode, SIGNED))) |
1673 { | |
1674 code = LT; | |
1675 op1 = immed_wide_int_const (wi::add (const_val, 1), mode); | |
1676 } | |
0 | 1677 break; |
1678 | |
1679 case GE: | |
111 | 1680 if (wi::ne_p (const_val, wi::min_value (mode, SIGNED))) |
1681 { | |
1682 code = GT; | |
1683 op1 = immed_wide_int_const (wi::sub (const_val, 1), mode); | |
1684 } | |
0 | 1685 break; |
1686 | |
1687 case LEU: | |
111 | 1688 if (wi::ne_p (const_val, -1)) |
1689 { | |
1690 code = LTU; | |
1691 op1 = immed_wide_int_const (wi::add (const_val, 1), mode); | |
1692 } | |
0 | 1693 break; |
1694 | |
1695 case GEU: | |
111 | 1696 if (wi::ne_p (const_val, 0)) |
1697 { | |
1698 code = GTU; | |
1699 op1 = immed_wide_int_const (wi::sub (const_val, 1), mode); | |
1700 } | |
0 | 1701 break; |
1702 | |
1703 default: | |
1704 break; | |
1705 } | |
1706 } | |
1707 | |
1708 if (op0 != XEXP (cond, 0) | |
1709 || op1 != XEXP (cond, 1) | |
1710 || code != GET_CODE (cond) | |
1711 || GET_MODE (cond) != SImode) | |
1712 cond = gen_rtx_fmt_ee (code, SImode, op0, op1); | |
1713 | |
1714 return cond; | |
1715 } | |
1716 | |
111 | 1717 /* Reverses CONDition; returns NULL if we cannot. */ |
1718 | |
1719 static rtx | |
1720 reversed_condition (rtx cond) | |
1721 { | |
1722 enum rtx_code reversed; | |
1723 reversed = reversed_comparison_code (cond, NULL); | |
1724 if (reversed == UNKNOWN) | |
1725 return NULL_RTX; | |
1726 else | |
1727 return gen_rtx_fmt_ee (reversed, | |
1728 GET_MODE (cond), XEXP (cond, 0), | |
1729 XEXP (cond, 1)); | |
1730 } | |
1731 | |
0 | 1732 /* Tries to use the fact that COND holds to simplify EXPR. ALTERED is the |
1733 set of altered regs. */ | |
1734 | |
1735 void | |
1736 simplify_using_condition (rtx cond, rtx *expr, regset altered) | |
1737 { | |
1738 rtx rev, reve, exp = *expr; | |
1739 | |
1740 /* If some register gets altered later, we do not really speak about its | |
1741 value at the time of comparison. */ | |
111 | 1742 if (altered && altered_reg_used (cond, altered)) |
0 | 1743 return; |
1744 | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1745 if (GET_CODE (cond) == EQ |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1746 && REG_P (XEXP (cond, 0)) && CONSTANT_P (XEXP (cond, 1))) |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1747 { |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1748 *expr = simplify_replace_rtx (*expr, XEXP (cond, 0), XEXP (cond, 1)); |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1749 return; |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1750 } |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1751 |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1752 if (!COMPARISON_P (exp)) |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1753 return; |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1754 |
0 | 1755 rev = reversed_condition (cond); |
1756 reve = reversed_condition (exp); | |
1757 | |
1758 cond = canon_condition (cond); | |
1759 exp = canon_condition (exp); | |
1760 if (rev) | |
1761 rev = canon_condition (rev); | |
1762 if (reve) | |
1763 reve = canon_condition (reve); | |
1764 | |
1765 if (rtx_equal_p (exp, cond)) | |
1766 { | |
1767 *expr = const_true_rtx; | |
1768 return; | |
1769 } | |
1770 | |
1771 if (rev && rtx_equal_p (exp, rev)) | |
1772 { | |
1773 *expr = const0_rtx; | |
1774 return; | |
1775 } | |
1776 | |
1777 if (implies_p (cond, exp)) | |
1778 { | |
1779 *expr = const_true_rtx; | |
1780 return; | |
1781 } | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1782 |
0 | 1783 if (reve && implies_p (cond, reve)) |
1784 { | |
1785 *expr = const0_rtx; | |
1786 return; | |
1787 } | |
1788 | |
1789 /* A proof by contradiction. If *EXPR implies (not cond), *EXPR must | |
1790 be false. */ | |
1791 if (rev && implies_p (exp, rev)) | |
1792 { | |
1793 *expr = const0_rtx; | |
1794 return; | |
1795 } | |
1796 | |
1797 /* Similarly, If (not *EXPR) implies (not cond), *EXPR must be true. */ | |
1798 if (rev && reve && implies_p (reve, rev)) | |
1799 { | |
1800 *expr = const_true_rtx; | |
1801 return; | |
1802 } | |
1803 | |
1804 /* We would like to have some other tests here. TODO. */ | |
1805 | |
1806 return; | |
1807 } | |
1808 | |
1809 /* Use relationship between A and *B to eventually eliminate *B. | |
1810 OP is the operation we consider. */ | |
1811 | |
1812 static void | |
1813 eliminate_implied_condition (enum rtx_code op, rtx a, rtx *b) | |
1814 { | |
1815 switch (op) | |
1816 { | |
1817 case AND: | |
1818 /* If A implies *B, we may replace *B by true. */ | |
1819 if (implies_p (a, *b)) | |
1820 *b = const_true_rtx; | |
1821 break; | |
1822 | |
1823 case IOR: | |
1824 /* If *B implies A, we may replace *B by false. */ | |
1825 if (implies_p (*b, a)) | |
1826 *b = const0_rtx; | |
1827 break; | |
1828 | |
1829 default: | |
1830 gcc_unreachable (); | |
1831 } | |
1832 } | |
1833 | |
1834 /* Eliminates the conditions in TAIL that are implied by HEAD. OP is the | |
1835 operation we consider. */ | |
1836 | |
1837 static void | |
1838 eliminate_implied_conditions (enum rtx_code op, rtx *head, rtx tail) | |
1839 { | |
1840 rtx elt; | |
1841 | |
1842 for (elt = tail; elt; elt = XEXP (elt, 1)) | |
1843 eliminate_implied_condition (op, *head, &XEXP (elt, 0)); | |
1844 for (elt = tail; elt; elt = XEXP (elt, 1)) | |
1845 eliminate_implied_condition (op, XEXP (elt, 0), head); | |
1846 } | |
1847 | |
1848 /* Simplifies *EXPR using initial values at the start of the LOOP. If *EXPR | |
1849 is a list, its elements are assumed to be combined using OP. */ | |
1850 | |
1851 static void | |
1852 simplify_using_initial_values (struct loop *loop, enum rtx_code op, rtx *expr) | |
1853 { | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1854 bool expression_valid; |
111 | 1855 rtx head, tail, last_valid_expr; |
1856 rtx_expr_list *cond_list; | |
1857 rtx_insn *insn; | |
0 | 1858 rtx neutral, aggr; |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1859 regset altered, this_altered; |
0 | 1860 edge e; |
1861 | |
1862 if (!*expr) | |
1863 return; | |
1864 | |
1865 if (CONSTANT_P (*expr)) | |
1866 return; | |
1867 | |
1868 if (GET_CODE (*expr) == EXPR_LIST) | |
1869 { | |
1870 head = XEXP (*expr, 0); | |
1871 tail = XEXP (*expr, 1); | |
1872 | |
1873 eliminate_implied_conditions (op, &head, tail); | |
1874 | |
1875 switch (op) | |
1876 { | |
1877 case AND: | |
1878 neutral = const_true_rtx; | |
1879 aggr = const0_rtx; | |
1880 break; | |
1881 | |
1882 case IOR: | |
1883 neutral = const0_rtx; | |
1884 aggr = const_true_rtx; | |
1885 break; | |
1886 | |
1887 default: | |
1888 gcc_unreachable (); | |
1889 } | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1890 |
0 | 1891 simplify_using_initial_values (loop, UNKNOWN, &head); |
1892 if (head == aggr) | |
1893 { | |
1894 XEXP (*expr, 0) = aggr; | |
1895 XEXP (*expr, 1) = NULL_RTX; | |
1896 return; | |
1897 } | |
1898 else if (head == neutral) | |
1899 { | |
1900 *expr = tail; | |
1901 simplify_using_initial_values (loop, op, expr); | |
1902 return; | |
1903 } | |
1904 simplify_using_initial_values (loop, op, &tail); | |
1905 | |
1906 if (tail && XEXP (tail, 0) == aggr) | |
1907 { | |
1908 *expr = tail; | |
1909 return; | |
1910 } | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1911 |
0 | 1912 XEXP (*expr, 0) = head; |
1913 XEXP (*expr, 1) = tail; | |
1914 return; | |
1915 } | |
1916 | |
1917 gcc_assert (op == UNKNOWN); | |
1918 | |
111 | 1919 replace_single_def_regs (expr); |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1920 if (CONSTANT_P (*expr)) |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1921 return; |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1922 |
0 | 1923 e = loop_preheader_edge (loop); |
111 | 1924 if (e->src == ENTRY_BLOCK_PTR_FOR_FN (cfun)) |
0 | 1925 return; |
1926 | |
1927 altered = ALLOC_REG_SET (®_obstack); | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1928 this_altered = ALLOC_REG_SET (®_obstack); |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1929 |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1930 expression_valid = true; |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1931 last_valid_expr = *expr; |
111 | 1932 cond_list = NULL; |
0 | 1933 while (1) |
1934 { | |
1935 insn = BB_END (e->src); | |
1936 if (any_condjump_p (insn)) | |
1937 { | |
1938 rtx cond = get_condition (BB_END (e->src), NULL, false, true); | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1939 |
0 | 1940 if (cond && (e->flags & EDGE_FALLTHRU)) |
1941 cond = reversed_condition (cond); | |
1942 if (cond) | |
1943 { | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1944 rtx old = *expr; |
0 | 1945 simplify_using_condition (cond, expr, altered); |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1946 if (old != *expr) |
0 | 1947 { |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1948 rtx note; |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1949 if (CONSTANT_P (*expr)) |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1950 goto out; |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1951 for (note = cond_list; note; note = XEXP (note, 1)) |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1952 { |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1953 simplify_using_condition (XEXP (note, 0), expr, altered); |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1954 if (CONSTANT_P (*expr)) |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1955 goto out; |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1956 } |
0 | 1957 } |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1958 cond_list = alloc_EXPR_LIST (0, cond, cond_list); |
0 | 1959 } |
1960 } | |
1961 | |
1962 FOR_BB_INSNS_REVERSE (e->src, insn) | |
1963 { | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1964 rtx src, dest; |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1965 rtx old = *expr; |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1966 |
0 | 1967 if (!INSN_P (insn)) |
1968 continue; | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1969 |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1970 CLEAR_REG_SET (this_altered); |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1971 note_stores (PATTERN (insn), mark_altered, this_altered); |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1972 if (CALL_P (insn)) |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1973 { |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1974 /* Kill all call clobbered registers. */ |
111 | 1975 unsigned int i; |
1976 hard_reg_set_iterator hrsi; | |
1977 EXECUTE_IF_SET_IN_HARD_REG_SET (regs_invalidated_by_call, | |
1978 0, i, hrsi) | |
1979 SET_REGNO_REG_SET (this_altered, i); | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1980 } |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1981 |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1982 if (suitable_set_for_replacement (insn, &dest, &src)) |
0 | 1983 { |
111 | 1984 rtx_expr_list **pnote, **pnote_next; |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1985 |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1986 replace_in_expr (expr, dest, src); |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1987 if (CONSTANT_P (*expr)) |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1988 goto out; |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1989 |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1990 for (pnote = &cond_list; *pnote; pnote = pnote_next) |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1991 { |
111 | 1992 rtx_expr_list *note = *pnote; |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1993 rtx old_cond = XEXP (note, 0); |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1994 |
111 | 1995 pnote_next = (rtx_expr_list **)&XEXP (note, 1); |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1996 replace_in_expr (&XEXP (note, 0), dest, src); |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1997 |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1998 /* We can no longer use a condition that has been simplified |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
1999 to a constant, and simplify_using_condition will abort if |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2000 we try. */ |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2001 if (CONSTANT_P (XEXP (note, 0))) |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2002 { |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2003 *pnote = *pnote_next; |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2004 pnote_next = pnote; |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2005 free_EXPR_LIST_node (note); |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2006 } |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2007 /* Retry simplifications with this condition if either the |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2008 expression or the condition changed. */ |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2009 else if (old_cond != XEXP (note, 0) || old != *expr) |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2010 simplify_using_condition (XEXP (note, 0), expr, altered); |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2011 } |
0 | 2012 } |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2013 else |
111 | 2014 { |
2015 rtx_expr_list **pnote, **pnote_next; | |
2016 | |
2017 /* If we did not use this insn to make a replacement, any overlap | |
2018 between stores in this insn and our expression will cause the | |
2019 expression to become invalid. */ | |
2020 if (altered_reg_used (*expr, this_altered)) | |
2021 goto out; | |
2022 | |
2023 /* Likewise for the conditions. */ | |
2024 for (pnote = &cond_list; *pnote; pnote = pnote_next) | |
2025 { | |
2026 rtx_expr_list *note = *pnote; | |
2027 rtx old_cond = XEXP (note, 0); | |
2028 | |
2029 pnote_next = (rtx_expr_list **)&XEXP (note, 1); | |
2030 if (altered_reg_used (old_cond, this_altered)) | |
2031 { | |
2032 *pnote = *pnote_next; | |
2033 pnote_next = pnote; | |
2034 free_EXPR_LIST_node (note); | |
2035 } | |
2036 } | |
2037 } | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2038 |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2039 if (CONSTANT_P (*expr)) |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2040 goto out; |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2041 |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2042 IOR_REG_SET (altered, this_altered); |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2043 |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2044 /* If the expression now contains regs that have been altered, we |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2045 can't return it to the caller. However, it is still valid for |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2046 further simplification, so keep searching to see if we can |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2047 eventually turn it into a constant. */ |
111 | 2048 if (altered_reg_used (*expr, altered)) |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2049 expression_valid = false; |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2050 if (expression_valid) |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2051 last_valid_expr = *expr; |
0 | 2052 } |
2053 | |
2054 if (!single_pred_p (e->src) | |
111 | 2055 || single_pred (e->src) == ENTRY_BLOCK_PTR_FOR_FN (cfun)) |
0 | 2056 break; |
2057 e = single_pred_edge (e->src); | |
2058 } | |
2059 | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2060 out: |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2061 free_EXPR_LIST_list (&cond_list); |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2062 if (!CONSTANT_P (*expr)) |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2063 *expr = last_valid_expr; |
0 | 2064 FREE_REG_SET (altered); |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2065 FREE_REG_SET (this_altered); |
0 | 2066 } |
2067 | |
2068 /* Transforms invariant IV into MODE. Adds assumptions based on the fact | |
2069 that IV occurs as left operands of comparison COND and its signedness | |
2070 is SIGNED_P to DESC. */ | |
2071 | |
2072 static void | |
111 | 2073 shorten_into_mode (struct rtx_iv *iv, scalar_int_mode mode, |
0 | 2074 enum rtx_code cond, bool signed_p, struct niter_desc *desc) |
2075 { | |
2076 rtx mmin, mmax, cond_over, cond_under; | |
2077 | |
2078 get_mode_bounds (mode, signed_p, iv->extend_mode, &mmin, &mmax); | |
2079 cond_under = simplify_gen_relational (LT, SImode, iv->extend_mode, | |
2080 iv->base, mmin); | |
2081 cond_over = simplify_gen_relational (GT, SImode, iv->extend_mode, | |
2082 iv->base, mmax); | |
2083 | |
2084 switch (cond) | |
2085 { | |
2086 case LE: | |
2087 case LT: | |
2088 case LEU: | |
2089 case LTU: | |
2090 if (cond_under != const0_rtx) | |
2091 desc->infinite = | |
2092 alloc_EXPR_LIST (0, cond_under, desc->infinite); | |
2093 if (cond_over != const0_rtx) | |
2094 desc->noloop_assumptions = | |
2095 alloc_EXPR_LIST (0, cond_over, desc->noloop_assumptions); | |
2096 break; | |
2097 | |
2098 case GE: | |
2099 case GT: | |
2100 case GEU: | |
2101 case GTU: | |
2102 if (cond_over != const0_rtx) | |
2103 desc->infinite = | |
2104 alloc_EXPR_LIST (0, cond_over, desc->infinite); | |
2105 if (cond_under != const0_rtx) | |
2106 desc->noloop_assumptions = | |
2107 alloc_EXPR_LIST (0, cond_under, desc->noloop_assumptions); | |
2108 break; | |
2109 | |
2110 case NE: | |
2111 if (cond_over != const0_rtx) | |
2112 desc->infinite = | |
2113 alloc_EXPR_LIST (0, cond_over, desc->infinite); | |
2114 if (cond_under != const0_rtx) | |
2115 desc->infinite = | |
2116 alloc_EXPR_LIST (0, cond_under, desc->infinite); | |
2117 break; | |
2118 | |
2119 default: | |
2120 gcc_unreachable (); | |
2121 } | |
2122 | |
2123 iv->mode = mode; | |
111 | 2124 iv->extend = signed_p ? IV_SIGN_EXTEND : IV_ZERO_EXTEND; |
0 | 2125 } |
2126 | |
2127 /* Transforms IV0 and IV1 compared by COND so that they are both compared as | |
2128 subregs of the same mode if possible (sometimes it is necessary to add | |
2129 some assumptions to DESC). */ | |
2130 | |
2131 static bool | |
2132 canonicalize_iv_subregs (struct rtx_iv *iv0, struct rtx_iv *iv1, | |
2133 enum rtx_code cond, struct niter_desc *desc) | |
2134 { | |
111 | 2135 scalar_int_mode comp_mode; |
0 | 2136 bool signed_p; |
2137 | |
2138 /* If the ivs behave specially in the first iteration, or are | |
2139 added/multiplied after extending, we ignore them. */ | |
2140 if (iv0->first_special || iv0->mult != const1_rtx || iv0->delta != const0_rtx) | |
2141 return false; | |
2142 if (iv1->first_special || iv1->mult != const1_rtx || iv1->delta != const0_rtx) | |
2143 return false; | |
2144 | |
2145 /* If there is some extend, it must match signedness of the comparison. */ | |
2146 switch (cond) | |
2147 { | |
2148 case LE: | |
2149 case LT: | |
111 | 2150 if (iv0->extend == IV_ZERO_EXTEND |
2151 || iv1->extend == IV_ZERO_EXTEND) | |
0 | 2152 return false; |
2153 signed_p = true; | |
2154 break; | |
2155 | |
2156 case LEU: | |
2157 case LTU: | |
111 | 2158 if (iv0->extend == IV_SIGN_EXTEND |
2159 || iv1->extend == IV_SIGN_EXTEND) | |
0 | 2160 return false; |
2161 signed_p = false; | |
2162 break; | |
2163 | |
2164 case NE: | |
111 | 2165 if (iv0->extend != IV_UNKNOWN_EXTEND |
2166 && iv1->extend != IV_UNKNOWN_EXTEND | |
0 | 2167 && iv0->extend != iv1->extend) |
2168 return false; | |
2169 | |
2170 signed_p = false; | |
111 | 2171 if (iv0->extend != IV_UNKNOWN_EXTEND) |
2172 signed_p = iv0->extend == IV_SIGN_EXTEND; | |
2173 if (iv1->extend != IV_UNKNOWN_EXTEND) | |
2174 signed_p = iv1->extend == IV_SIGN_EXTEND; | |
0 | 2175 break; |
2176 | |
2177 default: | |
2178 gcc_unreachable (); | |
2179 } | |
2180 | |
2181 /* Values of both variables should be computed in the same mode. These | |
2182 might indeed be different, if we have comparison like | |
2183 | |
2184 (compare (subreg:SI (iv0)) (subreg:SI (iv1))) | |
2185 | |
2186 and iv0 and iv1 are both ivs iterating in SI mode, but calculated | |
2187 in different modes. This does not seem impossible to handle, but | |
2188 it hardly ever occurs in practice. | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2189 |
0 | 2190 The only exception is the case when one of operands is invariant. |
2191 For example pentium 3 generates comparisons like | |
2192 (lt (subreg:HI (reg:SI)) 100). Here we assign HImode to 100, but we | |
2193 definitely do not want this prevent the optimization. */ | |
2194 comp_mode = iv0->extend_mode; | |
2195 if (GET_MODE_BITSIZE (comp_mode) < GET_MODE_BITSIZE (iv1->extend_mode)) | |
2196 comp_mode = iv1->extend_mode; | |
2197 | |
2198 if (iv0->extend_mode != comp_mode) | |
2199 { | |
2200 if (iv0->mode != iv0->extend_mode | |
2201 || iv0->step != const0_rtx) | |
2202 return false; | |
2203 | |
2204 iv0->base = simplify_gen_unary (signed_p ? SIGN_EXTEND : ZERO_EXTEND, | |
2205 comp_mode, iv0->base, iv0->mode); | |
2206 iv0->extend_mode = comp_mode; | |
2207 } | |
2208 | |
2209 if (iv1->extend_mode != comp_mode) | |
2210 { | |
2211 if (iv1->mode != iv1->extend_mode | |
2212 || iv1->step != const0_rtx) | |
2213 return false; | |
2214 | |
2215 iv1->base = simplify_gen_unary (signed_p ? SIGN_EXTEND : ZERO_EXTEND, | |
2216 comp_mode, iv1->base, iv1->mode); | |
2217 iv1->extend_mode = comp_mode; | |
2218 } | |
2219 | |
2220 /* Check that both ivs belong to a range of a single mode. If one of the | |
2221 operands is an invariant, we may need to shorten it into the common | |
2222 mode. */ | |
2223 if (iv0->mode == iv0->extend_mode | |
2224 && iv0->step == const0_rtx | |
2225 && iv0->mode != iv1->mode) | |
2226 shorten_into_mode (iv0, iv1->mode, cond, signed_p, desc); | |
2227 | |
2228 if (iv1->mode == iv1->extend_mode | |
2229 && iv1->step == const0_rtx | |
2230 && iv0->mode != iv1->mode) | |
2231 shorten_into_mode (iv1, iv0->mode, swap_condition (cond), signed_p, desc); | |
2232 | |
2233 if (iv0->mode != iv1->mode) | |
2234 return false; | |
2235 | |
2236 desc->mode = iv0->mode; | |
2237 desc->signed_p = signed_p; | |
2238 | |
2239 return true; | |
2240 } | |
2241 | |
111 | 2242 /* Tries to estimate the maximum number of iterations in LOOP, and return the |
2243 result. This function is called from iv_number_of_iterations with | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2244 a number of fields in DESC already filled in. OLD_NITER is the original |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2245 expression for the number of iterations, before we tried to simplify it. */ |
0 | 2246 |
111 | 2247 static uint64_t |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2248 determine_max_iter (struct loop *loop, struct niter_desc *desc, rtx old_niter) |
0 | 2249 { |
2250 rtx niter = desc->niter_expr; | |
2251 rtx mmin, mmax, cmp; | |
111 | 2252 uint64_t nmax, inc; |
2253 uint64_t andmax = 0; | |
2254 | |
2255 /* We used to look for constant operand 0 of AND, | |
2256 but canonicalization should always make this impossible. */ | |
2257 gcc_checking_assert (GET_CODE (niter) != AND | |
2258 || !CONST_INT_P (XEXP (niter, 0))); | |
0 | 2259 |
2260 if (GET_CODE (niter) == AND | |
111 | 2261 && CONST_INT_P (XEXP (niter, 1))) |
0 | 2262 { |
111 | 2263 andmax = UINTVAL (XEXP (niter, 1)); |
2264 niter = XEXP (niter, 0); | |
0 | 2265 } |
2266 | |
2267 get_mode_bounds (desc->mode, desc->signed_p, desc->mode, &mmin, &mmax); | |
111 | 2268 nmax = UINTVAL (mmax) - UINTVAL (mmin); |
0 | 2269 |
2270 if (GET_CODE (niter) == UDIV) | |
2271 { | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2272 if (!CONST_INT_P (XEXP (niter, 1))) |
111 | 2273 return nmax; |
0 | 2274 inc = INTVAL (XEXP (niter, 1)); |
2275 niter = XEXP (niter, 0); | |
2276 } | |
2277 else | |
2278 inc = 1; | |
2279 | |
2280 /* We could use a binary search here, but for now improving the upper | |
2281 bound by just one eliminates one important corner case. */ | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2282 cmp = simplify_gen_relational (desc->signed_p ? LT : LTU, VOIDmode, |
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2283 desc->mode, old_niter, mmax); |
0 | 2284 simplify_using_initial_values (loop, UNKNOWN, &cmp); |
2285 if (cmp == const_true_rtx) | |
2286 { | |
2287 nmax--; | |
2288 | |
2289 if (dump_file) | |
2290 fprintf (dump_file, ";; improved upper bound by one.\n"); | |
2291 } | |
111 | 2292 nmax /= inc; |
2293 if (andmax) | |
2294 nmax = MIN (nmax, andmax); | |
2295 if (dump_file) | |
2296 fprintf (dump_file, ";; Determined upper bound %" PRId64".\n", | |
2297 nmax); | |
2298 return nmax; | |
0 | 2299 } |
2300 | |
2301 /* Computes number of iterations of the CONDITION in INSN in LOOP and stores | |
2302 the result into DESC. Very similar to determine_number_of_iterations | |
2303 (basically its rtl version), complicated by things like subregs. */ | |
2304 | |
2305 static void | |
111 | 2306 iv_number_of_iterations (struct loop *loop, rtx_insn *insn, rtx condition, |
0 | 2307 struct niter_desc *desc) |
2308 { | |
2309 rtx op0, op1, delta, step, bound, may_xform, tmp, tmp0, tmp1; | |
111 | 2310 struct rtx_iv iv0, iv1; |
0 | 2311 rtx assumption, may_not_xform; |
2312 enum rtx_code cond; | |
111 | 2313 machine_mode nonvoid_mode; |
2314 scalar_int_mode comp_mode; | |
0 | 2315 rtx mmin, mmax, mode_mmin, mode_mmax; |
111 | 2316 uint64_t s, size, d, inv, max, up, down; |
2317 int64_t inc, step_val; | |
0 | 2318 int was_sharp = false; |
2319 rtx old_niter; | |
2320 bool step_is_pow2; | |
2321 | |
2322 /* The meaning of these assumptions is this: | |
2323 if !assumptions | |
2324 then the rest of information does not have to be valid | |
2325 if noloop_assumptions then the loop does not roll | |
2326 if infinite then this exit is never used */ | |
2327 | |
2328 desc->assumptions = NULL_RTX; | |
2329 desc->noloop_assumptions = NULL_RTX; | |
2330 desc->infinite = NULL_RTX; | |
2331 desc->simple_p = true; | |
2332 | |
2333 desc->const_iter = false; | |
2334 desc->niter_expr = NULL_RTX; | |
2335 | |
2336 cond = GET_CODE (condition); | |
2337 gcc_assert (COMPARISON_P (condition)); | |
2338 | |
111 | 2339 nonvoid_mode = GET_MODE (XEXP (condition, 0)); |
2340 if (nonvoid_mode == VOIDmode) | |
2341 nonvoid_mode = GET_MODE (XEXP (condition, 1)); | |
0 | 2342 /* The constant comparisons should be folded. */ |
111 | 2343 gcc_assert (nonvoid_mode != VOIDmode); |
0 | 2344 |
2345 /* We only handle integers or pointers. */ | |
111 | 2346 scalar_int_mode mode; |
2347 if (!is_a <scalar_int_mode> (nonvoid_mode, &mode)) | |
0 | 2348 goto fail; |
2349 | |
2350 op0 = XEXP (condition, 0); | |
111 | 2351 if (!iv_analyze (insn, mode, op0, &iv0)) |
0 | 2352 goto fail; |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2353 |
0 | 2354 op1 = XEXP (condition, 1); |
111 | 2355 if (!iv_analyze (insn, mode, op1, &iv1)) |
0 | 2356 goto fail; |
2357 | |
2358 if (GET_MODE_BITSIZE (iv0.extend_mode) > HOST_BITS_PER_WIDE_INT | |
2359 || GET_MODE_BITSIZE (iv1.extend_mode) > HOST_BITS_PER_WIDE_INT) | |
2360 goto fail; | |
2361 | |
2362 /* Check condition and normalize it. */ | |
2363 | |
2364 switch (cond) | |
2365 { | |
2366 case GE: | |
2367 case GT: | |
2368 case GEU: | |
2369 case GTU: | |
111 | 2370 std::swap (iv0, iv1); |
0 | 2371 cond = swap_condition (cond); |
2372 break; | |
2373 case NE: | |
2374 case LE: | |
2375 case LEU: | |
2376 case LT: | |
2377 case LTU: | |
2378 break; | |
2379 default: | |
2380 goto fail; | |
2381 } | |
2382 | |
2383 /* Handle extends. This is relatively nontrivial, so we only try in some | |
2384 easy cases, when we can canonicalize the ivs (possibly by adding some | |
2385 assumptions) to shape subreg (base + i * step). This function also fills | |
2386 in desc->mode and desc->signed_p. */ | |
2387 | |
2388 if (!canonicalize_iv_subregs (&iv0, &iv1, cond, desc)) | |
2389 goto fail; | |
2390 | |
2391 comp_mode = iv0.extend_mode; | |
2392 mode = iv0.mode; | |
111 | 2393 size = GET_MODE_PRECISION (mode); |
0 | 2394 get_mode_bounds (mode, (cond == LE || cond == LT), comp_mode, &mmin, &mmax); |
2395 mode_mmin = lowpart_subreg (mode, mmin, comp_mode); | |
2396 mode_mmax = lowpart_subreg (mode, mmax, comp_mode); | |
2397 | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2398 if (!CONST_INT_P (iv0.step) || !CONST_INT_P (iv1.step)) |
0 | 2399 goto fail; |
2400 | |
2401 /* We can take care of the case of two induction variables chasing each other | |
2402 if the test is NE. I have never seen a loop using it, but still it is | |
2403 cool. */ | |
2404 if (iv0.step != const0_rtx && iv1.step != const0_rtx) | |
2405 { | |
2406 if (cond != NE) | |
2407 goto fail; | |
2408 | |
2409 iv0.step = simplify_gen_binary (MINUS, comp_mode, iv0.step, iv1.step); | |
2410 iv1.step = const0_rtx; | |
2411 } | |
2412 | |
111 | 2413 iv0.step = lowpart_subreg (mode, iv0.step, comp_mode); |
2414 iv1.step = lowpart_subreg (mode, iv1.step, comp_mode); | |
2415 | |
0 | 2416 /* This is either infinite loop or the one that ends immediately, depending |
2417 on initial values. Unswitching should remove this kind of conditions. */ | |
2418 if (iv0.step == const0_rtx && iv1.step == const0_rtx) | |
2419 goto fail; | |
2420 | |
2421 if (cond != NE) | |
2422 { | |
2423 if (iv0.step == const0_rtx) | |
2424 step_val = -INTVAL (iv1.step); | |
2425 else | |
2426 step_val = INTVAL (iv0.step); | |
2427 | |
2428 /* Ignore loops of while (i-- < 10) type. */ | |
2429 if (step_val < 0) | |
2430 goto fail; | |
2431 | |
2432 step_is_pow2 = !(step_val & (step_val - 1)); | |
2433 } | |
2434 else | |
2435 { | |
2436 /* We do not care about whether the step is power of two in this | |
2437 case. */ | |
2438 step_is_pow2 = false; | |
2439 step_val = 0; | |
2440 } | |
2441 | |
2442 /* Some more condition normalization. We must record some assumptions | |
2443 due to overflows. */ | |
2444 switch (cond) | |
2445 { | |
2446 case LT: | |
2447 case LTU: | |
2448 /* We want to take care only of non-sharp relationals; this is easy, | |
2449 as in cases the overflow would make the transformation unsafe | |
2450 the loop does not roll. Seemingly it would make more sense to want | |
2451 to take care of sharp relationals instead, as NE is more similar to | |
2452 them, but the problem is that here the transformation would be more | |
2453 difficult due to possibly infinite loops. */ | |
2454 if (iv0.step == const0_rtx) | |
2455 { | |
2456 tmp = lowpart_subreg (mode, iv0.base, comp_mode); | |
2457 assumption = simplify_gen_relational (EQ, SImode, mode, tmp, | |
2458 mode_mmax); | |
2459 if (assumption == const_true_rtx) | |
2460 goto zero_iter_simplify; | |
2461 iv0.base = simplify_gen_binary (PLUS, comp_mode, | |
2462 iv0.base, const1_rtx); | |
2463 } | |
2464 else | |
2465 { | |
2466 tmp = lowpart_subreg (mode, iv1.base, comp_mode); | |
2467 assumption = simplify_gen_relational (EQ, SImode, mode, tmp, | |
2468 mode_mmin); | |
2469 if (assumption == const_true_rtx) | |
2470 goto zero_iter_simplify; | |
2471 iv1.base = simplify_gen_binary (PLUS, comp_mode, | |
2472 iv1.base, constm1_rtx); | |
2473 } | |
2474 | |
2475 if (assumption != const0_rtx) | |
2476 desc->noloop_assumptions = | |
2477 alloc_EXPR_LIST (0, assumption, desc->noloop_assumptions); | |
2478 cond = (cond == LT) ? LE : LEU; | |
2479 | |
2480 /* It will be useful to be able to tell the difference once more in | |
2481 LE -> NE reduction. */ | |
2482 was_sharp = true; | |
2483 break; | |
2484 default: ; | |
2485 } | |
2486 | |
2487 /* Take care of trivially infinite loops. */ | |
2488 if (cond != NE) | |
2489 { | |
2490 if (iv0.step == const0_rtx) | |
2491 { | |
2492 tmp = lowpart_subreg (mode, iv0.base, comp_mode); | |
2493 if (rtx_equal_p (tmp, mode_mmin)) | |
2494 { | |
2495 desc->infinite = | |
2496 alloc_EXPR_LIST (0, const_true_rtx, NULL_RTX); | |
2497 /* Fill in the remaining fields somehow. */ | |
2498 goto zero_iter_simplify; | |
2499 } | |
2500 } | |
2501 else | |
2502 { | |
2503 tmp = lowpart_subreg (mode, iv1.base, comp_mode); | |
2504 if (rtx_equal_p (tmp, mode_mmax)) | |
2505 { | |
2506 desc->infinite = | |
2507 alloc_EXPR_LIST (0, const_true_rtx, NULL_RTX); | |
2508 /* Fill in the remaining fields somehow. */ | |
2509 goto zero_iter_simplify; | |
2510 } | |
2511 } | |
2512 } | |
2513 | |
2514 /* If we can we want to take care of NE conditions instead of size | |
2515 comparisons, as they are much more friendly (most importantly | |
2516 this takes care of special handling of loops with step 1). We can | |
2517 do it if we first check that upper bound is greater or equal to | |
2518 lower bound, their difference is constant c modulo step and that | |
2519 there is not an overflow. */ | |
2520 if (cond != NE) | |
2521 { | |
2522 if (iv0.step == const0_rtx) | |
2523 step = simplify_gen_unary (NEG, comp_mode, iv1.step, comp_mode); | |
2524 else | |
2525 step = iv0.step; | |
111 | 2526 step = lowpart_subreg (mode, step, comp_mode); |
0 | 2527 delta = simplify_gen_binary (MINUS, comp_mode, iv1.base, iv0.base); |
2528 delta = lowpart_subreg (mode, delta, comp_mode); | |
2529 delta = simplify_gen_binary (UMOD, mode, delta, step); | |
2530 may_xform = const0_rtx; | |
2531 may_not_xform = const_true_rtx; | |
2532 | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2533 if (CONST_INT_P (delta)) |
0 | 2534 { |
2535 if (was_sharp && INTVAL (delta) == INTVAL (step) - 1) | |
2536 { | |
2537 /* A special case. We have transformed condition of type | |
2538 for (i = 0; i < 4; i += 4) | |
2539 into | |
2540 for (i = 0; i <= 3; i += 4) | |
2541 obviously if the test for overflow during that transformation | |
2542 passed, we cannot overflow here. Most importantly any | |
2543 loop with sharp end condition and step 1 falls into this | |
2544 category, so handling this case specially is definitely | |
2545 worth the troubles. */ | |
2546 may_xform = const_true_rtx; | |
2547 } | |
2548 else if (iv0.step == const0_rtx) | |
2549 { | |
2550 bound = simplify_gen_binary (PLUS, comp_mode, mmin, step); | |
2551 bound = simplify_gen_binary (MINUS, comp_mode, bound, delta); | |
2552 bound = lowpart_subreg (mode, bound, comp_mode); | |
2553 tmp = lowpart_subreg (mode, iv0.base, comp_mode); | |
2554 may_xform = simplify_gen_relational (cond, SImode, mode, | |
2555 bound, tmp); | |
2556 may_not_xform = simplify_gen_relational (reverse_condition (cond), | |
2557 SImode, mode, | |
2558 bound, tmp); | |
2559 } | |
2560 else | |
2561 { | |
2562 bound = simplify_gen_binary (MINUS, comp_mode, mmax, step); | |
2563 bound = simplify_gen_binary (PLUS, comp_mode, bound, delta); | |
2564 bound = lowpart_subreg (mode, bound, comp_mode); | |
2565 tmp = lowpart_subreg (mode, iv1.base, comp_mode); | |
2566 may_xform = simplify_gen_relational (cond, SImode, mode, | |
2567 tmp, bound); | |
2568 may_not_xform = simplify_gen_relational (reverse_condition (cond), | |
2569 SImode, mode, | |
2570 tmp, bound); | |
2571 } | |
2572 } | |
2573 | |
2574 if (may_xform != const0_rtx) | |
2575 { | |
2576 /* We perform the transformation always provided that it is not | |
2577 completely senseless. This is OK, as we would need this assumption | |
2578 to determine the number of iterations anyway. */ | |
2579 if (may_xform != const_true_rtx) | |
2580 { | |
2581 /* If the step is a power of two and the final value we have | |
2582 computed overflows, the cycle is infinite. Otherwise it | |
2583 is nontrivial to compute the number of iterations. */ | |
2584 if (step_is_pow2) | |
2585 desc->infinite = alloc_EXPR_LIST (0, may_not_xform, | |
2586 desc->infinite); | |
2587 else | |
2588 desc->assumptions = alloc_EXPR_LIST (0, may_xform, | |
2589 desc->assumptions); | |
2590 } | |
2591 | |
2592 /* We are going to lose some information about upper bound on | |
2593 number of iterations in this step, so record the information | |
2594 here. */ | |
2595 inc = INTVAL (iv0.step) - INTVAL (iv1.step); | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2596 if (CONST_INT_P (iv1.base)) |
0 | 2597 up = INTVAL (iv1.base); |
2598 else | |
2599 up = INTVAL (mode_mmax) - inc; | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2600 down = INTVAL (CONST_INT_P (iv0.base) |
0 | 2601 ? iv0.base |
2602 : mode_mmin); | |
111 | 2603 max = (up - down) / inc + 1; |
2604 if (!desc->infinite | |
2605 && !desc->assumptions) | |
2606 record_niter_bound (loop, max, false, true); | |
0 | 2607 |
2608 if (iv0.step == const0_rtx) | |
2609 { | |
2610 iv0.base = simplify_gen_binary (PLUS, comp_mode, iv0.base, delta); | |
2611 iv0.base = simplify_gen_binary (MINUS, comp_mode, iv0.base, step); | |
2612 } | |
2613 else | |
2614 { | |
2615 iv1.base = simplify_gen_binary (MINUS, comp_mode, iv1.base, delta); | |
2616 iv1.base = simplify_gen_binary (PLUS, comp_mode, iv1.base, step); | |
2617 } | |
2618 | |
2619 tmp0 = lowpart_subreg (mode, iv0.base, comp_mode); | |
2620 tmp1 = lowpart_subreg (mode, iv1.base, comp_mode); | |
2621 assumption = simplify_gen_relational (reverse_condition (cond), | |
2622 SImode, mode, tmp0, tmp1); | |
2623 if (assumption == const_true_rtx) | |
2624 goto zero_iter_simplify; | |
2625 else if (assumption != const0_rtx) | |
2626 desc->noloop_assumptions = | |
2627 alloc_EXPR_LIST (0, assumption, desc->noloop_assumptions); | |
2628 cond = NE; | |
2629 } | |
2630 } | |
2631 | |
2632 /* Count the number of iterations. */ | |
2633 if (cond == NE) | |
2634 { | |
2635 /* Everything we do here is just arithmetics modulo size of mode. This | |
2636 makes us able to do more involved computations of number of iterations | |
2637 than in other cases. First transform the condition into shape | |
2638 s * i <> c, with s positive. */ | |
2639 iv1.base = simplify_gen_binary (MINUS, comp_mode, iv1.base, iv0.base); | |
2640 iv0.base = const0_rtx; | |
2641 iv0.step = simplify_gen_binary (MINUS, comp_mode, iv0.step, iv1.step); | |
2642 iv1.step = const0_rtx; | |
2643 if (INTVAL (iv0.step) < 0) | |
2644 { | |
111 | 2645 iv0.step = simplify_gen_unary (NEG, comp_mode, iv0.step, comp_mode); |
2646 iv1.base = simplify_gen_unary (NEG, comp_mode, iv1.base, comp_mode); | |
0 | 2647 } |
2648 iv0.step = lowpart_subreg (mode, iv0.step, comp_mode); | |
2649 | |
2650 /* Let nsd (s, size of mode) = d. If d does not divide c, the loop | |
2651 is infinite. Otherwise, the number of iterations is | |
2652 (inverse(s/d) * (c/d)) mod (size of mode/d). */ | |
2653 s = INTVAL (iv0.step); d = 1; | |
2654 while (s % 2 != 1) | |
2655 { | |
2656 s /= 2; | |
2657 d *= 2; | |
2658 size--; | |
2659 } | |
111 | 2660 bound = GEN_INT (((uint64_t) 1 << (size - 1 ) << 1) - 1); |
0 | 2661 |
2662 tmp1 = lowpart_subreg (mode, iv1.base, comp_mode); | |
111 | 2663 tmp = simplify_gen_binary (UMOD, mode, tmp1, gen_int_mode (d, mode)); |
0 | 2664 assumption = simplify_gen_relational (NE, SImode, mode, tmp, const0_rtx); |
2665 desc->infinite = alloc_EXPR_LIST (0, assumption, desc->infinite); | |
2666 | |
111 | 2667 tmp = simplify_gen_binary (UDIV, mode, tmp1, gen_int_mode (d, mode)); |
0 | 2668 inv = inverse (s, size); |
2669 tmp = simplify_gen_binary (MULT, mode, tmp, gen_int_mode (inv, mode)); | |
2670 desc->niter_expr = simplify_gen_binary (AND, mode, tmp, bound); | |
2671 } | |
2672 else | |
2673 { | |
2674 if (iv1.step == const0_rtx) | |
2675 /* Condition in shape a + s * i <= b | |
2676 We must know that b + s does not overflow and a <= b + s and then we | |
2677 can compute number of iterations as (b + s - a) / s. (It might | |
2678 seem that we in fact could be more clever about testing the b + s | |
2679 overflow condition using some information about b - a mod s, | |
2680 but it was already taken into account during LE -> NE transform). */ | |
2681 { | |
2682 step = iv0.step; | |
2683 tmp0 = lowpart_subreg (mode, iv0.base, comp_mode); | |
2684 tmp1 = lowpart_subreg (mode, iv1.base, comp_mode); | |
2685 | |
2686 bound = simplify_gen_binary (MINUS, mode, mode_mmax, | |
2687 lowpart_subreg (mode, step, | |
2688 comp_mode)); | |
2689 if (step_is_pow2) | |
2690 { | |
2691 rtx t0, t1; | |
2692 | |
2693 /* If s is power of 2, we know that the loop is infinite if | |
2694 a % s <= b % s and b + s overflows. */ | |
2695 assumption = simplify_gen_relational (reverse_condition (cond), | |
2696 SImode, mode, | |
2697 tmp1, bound); | |
2698 | |
2699 t0 = simplify_gen_binary (UMOD, mode, copy_rtx (tmp0), step); | |
2700 t1 = simplify_gen_binary (UMOD, mode, copy_rtx (tmp1), step); | |
2701 tmp = simplify_gen_relational (cond, SImode, mode, t0, t1); | |
2702 assumption = simplify_gen_binary (AND, SImode, assumption, tmp); | |
2703 desc->infinite = | |
2704 alloc_EXPR_LIST (0, assumption, desc->infinite); | |
2705 } | |
2706 else | |
2707 { | |
2708 assumption = simplify_gen_relational (cond, SImode, mode, | |
2709 tmp1, bound); | |
2710 desc->assumptions = | |
2711 alloc_EXPR_LIST (0, assumption, desc->assumptions); | |
2712 } | |
2713 | |
2714 tmp = simplify_gen_binary (PLUS, comp_mode, iv1.base, iv0.step); | |
2715 tmp = lowpart_subreg (mode, tmp, comp_mode); | |
2716 assumption = simplify_gen_relational (reverse_condition (cond), | |
2717 SImode, mode, tmp0, tmp); | |
2718 | |
2719 delta = simplify_gen_binary (PLUS, mode, tmp1, step); | |
2720 delta = simplify_gen_binary (MINUS, mode, delta, tmp0); | |
2721 } | |
2722 else | |
2723 { | |
2724 /* Condition in shape a <= b - s * i | |
2725 We must know that a - s does not overflow and a - s <= b and then | |
2726 we can again compute number of iterations as (b - (a - s)) / s. */ | |
2727 step = simplify_gen_unary (NEG, mode, iv1.step, mode); | |
2728 tmp0 = lowpart_subreg (mode, iv0.base, comp_mode); | |
2729 tmp1 = lowpart_subreg (mode, iv1.base, comp_mode); | |
2730 | |
2731 bound = simplify_gen_binary (PLUS, mode, mode_mmin, | |
2732 lowpart_subreg (mode, step, comp_mode)); | |
2733 if (step_is_pow2) | |
2734 { | |
2735 rtx t0, t1; | |
2736 | |
2737 /* If s is power of 2, we know that the loop is infinite if | |
2738 a % s <= b % s and a - s overflows. */ | |
2739 assumption = simplify_gen_relational (reverse_condition (cond), | |
2740 SImode, mode, | |
2741 bound, tmp0); | |
2742 | |
2743 t0 = simplify_gen_binary (UMOD, mode, copy_rtx (tmp0), step); | |
2744 t1 = simplify_gen_binary (UMOD, mode, copy_rtx (tmp1), step); | |
2745 tmp = simplify_gen_relational (cond, SImode, mode, t0, t1); | |
2746 assumption = simplify_gen_binary (AND, SImode, assumption, tmp); | |
2747 desc->infinite = | |
2748 alloc_EXPR_LIST (0, assumption, desc->infinite); | |
2749 } | |
2750 else | |
2751 { | |
2752 assumption = simplify_gen_relational (cond, SImode, mode, | |
2753 bound, tmp0); | |
2754 desc->assumptions = | |
2755 alloc_EXPR_LIST (0, assumption, desc->assumptions); | |
2756 } | |
2757 | |
2758 tmp = simplify_gen_binary (PLUS, comp_mode, iv0.base, iv1.step); | |
2759 tmp = lowpart_subreg (mode, tmp, comp_mode); | |
2760 assumption = simplify_gen_relational (reverse_condition (cond), | |
2761 SImode, mode, | |
2762 tmp, tmp1); | |
2763 delta = simplify_gen_binary (MINUS, mode, tmp0, step); | |
2764 delta = simplify_gen_binary (MINUS, mode, tmp1, delta); | |
2765 } | |
2766 if (assumption == const_true_rtx) | |
2767 goto zero_iter_simplify; | |
2768 else if (assumption != const0_rtx) | |
2769 desc->noloop_assumptions = | |
2770 alloc_EXPR_LIST (0, assumption, desc->noloop_assumptions); | |
2771 delta = simplify_gen_binary (UDIV, mode, delta, step); | |
2772 desc->niter_expr = delta; | |
2773 } | |
2774 | |
2775 old_niter = desc->niter_expr; | |
2776 | |
2777 simplify_using_initial_values (loop, AND, &desc->assumptions); | |
2778 if (desc->assumptions | |
2779 && XEXP (desc->assumptions, 0) == const0_rtx) | |
2780 goto fail; | |
2781 simplify_using_initial_values (loop, IOR, &desc->noloop_assumptions); | |
2782 simplify_using_initial_values (loop, IOR, &desc->infinite); | |
2783 simplify_using_initial_values (loop, UNKNOWN, &desc->niter_expr); | |
2784 | |
2785 /* Rerun the simplification. Consider code (created by copying loop headers) | |
2786 | |
2787 i = 0; | |
2788 | |
2789 if (0 < n) | |
2790 { | |
2791 do | |
2792 { | |
2793 i++; | |
2794 } while (i < n); | |
2795 } | |
2796 | |
2797 The first pass determines that i = 0, the second pass uses it to eliminate | |
2798 noloop assumption. */ | |
2799 | |
2800 simplify_using_initial_values (loop, AND, &desc->assumptions); | |
2801 if (desc->assumptions | |
2802 && XEXP (desc->assumptions, 0) == const0_rtx) | |
2803 goto fail; | |
2804 simplify_using_initial_values (loop, IOR, &desc->noloop_assumptions); | |
2805 simplify_using_initial_values (loop, IOR, &desc->infinite); | |
2806 simplify_using_initial_values (loop, UNKNOWN, &desc->niter_expr); | |
2807 | |
2808 if (desc->noloop_assumptions | |
2809 && XEXP (desc->noloop_assumptions, 0) == const_true_rtx) | |
2810 goto zero_iter; | |
2811 | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2812 if (CONST_INT_P (desc->niter_expr)) |
0 | 2813 { |
111 | 2814 uint64_t val = INTVAL (desc->niter_expr); |
0 | 2815 |
2816 desc->const_iter = true; | |
111 | 2817 desc->niter = val & GET_MODE_MASK (desc->mode); |
2818 if (!desc->infinite | |
2819 && !desc->assumptions) | |
2820 record_niter_bound (loop, desc->niter, false, true); | |
0 | 2821 } |
2822 else | |
2823 { | |
111 | 2824 max = determine_max_iter (loop, desc, old_niter); |
2825 if (!max) | |
2826 goto zero_iter_simplify; | |
2827 if (!desc->infinite | |
2828 && !desc->assumptions) | |
2829 record_niter_bound (loop, max, false, true); | |
0 | 2830 |
2831 /* simplify_using_initial_values does a copy propagation on the registers | |
2832 in the expression for the number of iterations. This prolongs life | |
2833 ranges of registers and increases register pressure, and usually | |
2834 brings no gain (and if it happens to do, the cse pass will take care | |
2835 of it anyway). So prevent this behavior, unless it enabled us to | |
2836 derive that the number of iterations is a constant. */ | |
2837 desc->niter_expr = old_niter; | |
2838 } | |
2839 | |
2840 return; | |
2841 | |
2842 zero_iter_simplify: | |
2843 /* Simplify the assumptions. */ | |
2844 simplify_using_initial_values (loop, AND, &desc->assumptions); | |
2845 if (desc->assumptions | |
2846 && XEXP (desc->assumptions, 0) == const0_rtx) | |
2847 goto fail; | |
2848 simplify_using_initial_values (loop, IOR, &desc->infinite); | |
2849 | |
2850 /* Fallthru. */ | |
2851 zero_iter: | |
2852 desc->const_iter = true; | |
2853 desc->niter = 0; | |
111 | 2854 record_niter_bound (loop, 0, true, true); |
0 | 2855 desc->noloop_assumptions = NULL_RTX; |
2856 desc->niter_expr = const0_rtx; | |
2857 return; | |
2858 | |
2859 fail: | |
2860 desc->simple_p = false; | |
2861 return; | |
2862 } | |
2863 | |
2864 /* Checks whether E is a simple exit from LOOP and stores its description | |
2865 into DESC. */ | |
2866 | |
2867 static void | |
2868 check_simple_exit (struct loop *loop, edge e, struct niter_desc *desc) | |
2869 { | |
2870 basic_block exit_bb; | |
111 | 2871 rtx condition; |
2872 rtx_insn *at; | |
0 | 2873 edge ein; |
2874 | |
2875 exit_bb = e->src; | |
2876 desc->simple_p = false; | |
2877 | |
2878 /* It must belong directly to the loop. */ | |
2879 if (exit_bb->loop_father != loop) | |
2880 return; | |
2881 | |
2882 /* It must be tested (at least) once during any iteration. */ | |
2883 if (!dominated_by_p (CDI_DOMINATORS, loop->latch, exit_bb)) | |
2884 return; | |
2885 | |
2886 /* It must end in a simple conditional jump. */ | |
2887 if (!any_condjump_p (BB_END (exit_bb))) | |
2888 return; | |
2889 | |
2890 ein = EDGE_SUCC (exit_bb, 0); | |
2891 if (ein == e) | |
2892 ein = EDGE_SUCC (exit_bb, 1); | |
2893 | |
2894 desc->out_edge = e; | |
2895 desc->in_edge = ein; | |
2896 | |
2897 /* Test whether the condition is suitable. */ | |
2898 if (!(condition = get_condition (BB_END (ein->src), &at, false, false))) | |
2899 return; | |
2900 | |
2901 if (ein->flags & EDGE_FALLTHRU) | |
2902 { | |
2903 condition = reversed_condition (condition); | |
2904 if (!condition) | |
2905 return; | |
2906 } | |
2907 | |
2908 /* Check that we are able to determine number of iterations and fill | |
2909 in information about it. */ | |
2910 iv_number_of_iterations (loop, at, condition, desc); | |
2911 } | |
2912 | |
2913 /* Finds a simple exit of LOOP and stores its description into DESC. */ | |
2914 | |
2915 void | |
2916 find_simple_exit (struct loop *loop, struct niter_desc *desc) | |
2917 { | |
2918 unsigned i; | |
2919 basic_block *body; | |
2920 edge e; | |
2921 struct niter_desc act; | |
2922 bool any = false; | |
2923 edge_iterator ei; | |
2924 | |
2925 desc->simple_p = false; | |
2926 body = get_loop_body (loop); | |
2927 | |
2928 for (i = 0; i < loop->num_nodes; i++) | |
2929 { | |
2930 FOR_EACH_EDGE (e, ei, body[i]->succs) | |
2931 { | |
2932 if (flow_bb_inside_loop_p (loop, e->dest)) | |
2933 continue; | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2934 |
0 | 2935 check_simple_exit (loop, e, &act); |
2936 if (!act.simple_p) | |
2937 continue; | |
2938 | |
2939 if (!any) | |
2940 any = true; | |
2941 else | |
2942 { | |
2943 /* Prefer constant iterations; the less the better. */ | |
2944 if (!act.const_iter | |
2945 || (desc->const_iter && act.niter >= desc->niter)) | |
2946 continue; | |
2947 | |
2948 /* Also if the actual exit may be infinite, while the old one | |
2949 not, prefer the old one. */ | |
2950 if (act.infinite && !desc->infinite) | |
2951 continue; | |
2952 } | |
55
77e2b8dfacca
update it from 4.4.3 to 4.5.0
ryoma <e075725@ie.u-ryukyu.ac.jp>
parents:
0
diff
changeset
|
2953 |
0 | 2954 *desc = act; |
2955 } | |
2956 } | |
2957 | |
2958 if (dump_file) | |
2959 { | |
2960 if (desc->simple_p) | |
2961 { | |
2962 fprintf (dump_file, "Loop %d is simple:\n", loop->num); | |
2963 fprintf (dump_file, " simple exit %d -> %d\n", | |
2964 desc->out_edge->src->index, | |
2965 desc->out_edge->dest->index); | |
2966 if (desc->assumptions) | |
2967 { | |
2968 fprintf (dump_file, " assumptions: "); | |
2969 print_rtl (dump_file, desc->assumptions); | |
2970 fprintf (dump_file, "\n"); | |
2971 } | |
2972 if (desc->noloop_assumptions) | |
2973 { | |
2974 fprintf (dump_file, " does not roll if: "); | |
2975 print_rtl (dump_file, desc->noloop_assumptions); | |
2976 fprintf (dump_file, "\n"); | |
2977 } | |
2978 if (desc->infinite) | |
2979 { | |
2980 fprintf (dump_file, " infinite if: "); | |
2981 print_rtl (dump_file, desc->infinite); | |
2982 fprintf (dump_file, "\n"); | |
2983 } | |
2984 | |
2985 fprintf (dump_file, " number of iterations: "); | |
2986 print_rtl (dump_file, desc->niter_expr); | |
2987 fprintf (dump_file, "\n"); | |
2988 | |
111 | 2989 fprintf (dump_file, " upper bound: %li\n", |
2990 (long)get_max_loop_iterations_int (loop)); | |
2991 fprintf (dump_file, " likely upper bound: %li\n", | |
2992 (long)get_likely_max_loop_iterations_int (loop)); | |
2993 fprintf (dump_file, " realistic bound: %li\n", | |
2994 (long)get_estimated_loop_iterations_int (loop)); | |
0 | 2995 } |
2996 else | |
2997 fprintf (dump_file, "Loop %d is not simple.\n", loop->num); | |
2998 } | |
2999 | |
3000 free (body); | |
3001 } | |
3002 | |
3003 /* Creates a simple loop description of LOOP if it was not computed | |
3004 already. */ | |
3005 | |
3006 struct niter_desc * | |
3007 get_simple_loop_desc (struct loop *loop) | |
3008 { | |
3009 struct niter_desc *desc = simple_loop_desc (loop); | |
3010 | |
3011 if (desc) | |
3012 return desc; | |
3013 | |
3014 /* At least desc->infinite is not always initialized by | |
3015 find_simple_loop_exit. */ | |
111 | 3016 desc = ggc_cleared_alloc<niter_desc> (); |
0 | 3017 iv_analysis_loop_init (loop); |
3018 find_simple_exit (loop, desc); | |
111 | 3019 loop->simple_loop_desc = desc; |
0 | 3020 return desc; |
3021 } | |
3022 | |
3023 /* Releases simple loop description for LOOP. */ | |
3024 | |
3025 void | |
3026 free_simple_loop_desc (struct loop *loop) | |
3027 { | |
3028 struct niter_desc *desc = simple_loop_desc (loop); | |
3029 | |
3030 if (!desc) | |
3031 return; | |
3032 | |
111 | 3033 ggc_free (desc); |
3034 loop->simple_loop_desc = NULL; | |
0 | 3035 } |