1 /* Post-reload compare elimination.
2 Copyright (C) 2010, 2011
3 Free Software Foundation, Inc.
4
5 This file is part of GCC.
6
7 GCC is free software; you can redistribute it and/or modify it under
8 the terms of the GNU General Public License as published by the Free
9 Software Foundation; either version 3, or (at your option) any later
10 version.
11
12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
14 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
15 for more details.
16
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING3. If not see
19 <http://www.gnu.org/licenses/>. */
20
21 /* There is a set of targets whose general-purpose move or addition
22 instructions clobber the flags. These targets cannot split their
23 CBRANCH/CSTORE etc patterns before reload is complete, lest reload
24 itself insert these instructions in between the flags setter and user.
25 Because these targets cannot split the compare from the use, they
26 cannot make use of the comparison elimination offered by the combine pass.
27
28 This is a small pass intended to provide comparison elimination similar to
29 what is available via NOTICE_UPDATE_CC for cc0 targets. This should help
30 encourage cc0 targets to convert to an explicit post-reload representation
31 of the flags.
32
33 This pass assumes:
34
35 (0) CBRANCH/CSTORE etc have been split in pass_split_after_reload.
36
37 (1) All comparison patterns are represented as
38
39 [(set (reg:CC) (compare:CC (reg) (immediate)))]
40
41 (2) All insn patterns that modify the flags are represented as
42
43 [(set (reg) (operation)
44 (clobber (reg:CC))]
45
46 (3) If an insn of form (2) can usefully set the flags, there is
47 another pattern of the form
48
49 [(set (reg) (operation)
50 (set (reg:CCM) (compare:CCM (operation) (immediate)))]
51
52 The mode CCM will be chosen as if by SELECT_CC_MODE.
53
54 Note that unlike NOTICE_UPDATE_CC, we do not handle memory operands.
55 This could be handled as a future enhancement.
56 */
57
58 #include "config.h"
59 #include "system.h"
60 #include "coretypes.h"
61 #include "tm.h"
62 #include "rtl.h"
63 #include "tm_p.h"
64 #include "insn-config.h"
65 #include "recog.h"
66 #include "flags.h"
67 #include "basic-block.h"
68 #include "tree-pass.h"
69 #include "target.h"
70 #include "df.h"
71 #include "domwalk.h"
72
73
74 /* These structures describe a comparison and how it is used. */
75
76 /* The choice of maximum 3 uses comes from wanting to eliminate the two
77 duplicate compares from a three-way branch on the sign of a value.
78 This is also sufficient to eliminate the duplicate compare against the
79 high-part of a double-word comparison. */
80 #define MAX_CMP_USE 3
81
82 struct comparison_use
83 {
84 /* The instruction in which the result of the compare is used. */
85 rtx insn;
86 /* The location of the flags register within the use. */
87 rtx *loc;
88 /* The comparison code applied against the flags register. */
89 enum rtx_code code;
90 };
91
92 struct comparison
93 {
94 /* The comparison instruction. */
95 rtx insn;
96
97 /* The insn prior to the comparison insn that clobbers the flags. */
98 rtx prev_clobber;
99
100 /* The two values being compared. These will be either REGs or
101 constants. */
102 rtx in_a, in_b;
103
104 /* Information about how this comparison is used. */
105 struct comparison_use uses[MAX_CMP_USE];
106
107 /* The original CC_MODE for this comparison. */
108 enum machine_mode orig_mode;
109
110 /* The number of uses identified for this comparison. */
111 unsigned short n_uses;
112
113 /* True if not all uses of this comparison have been identified.
114 This can happen either for overflowing the array above, or if
115 the flags register is used in some unusual context. */
116 bool missing_uses;
117
118 /* True if its inputs are still valid at the end of the block. */
119 bool inputs_valid;
120 };
121
122 typedef struct comparison *comparison_struct_p;
123 DEF_VEC_P(comparison_struct_p);
124 DEF_VEC_ALLOC_P(comparison_struct_p, heap);
125
VEC(comparison_struct_p,heap)126 static VEC(comparison_struct_p, heap) *all_compares;
127
128 /* Look for a "conforming" comparison, as defined above. If valid, return
129 the rtx for the COMPARE itself. */
130
131 static rtx
132 conforming_compare (rtx insn)
133 {
134 rtx set, src, dest;
135
136 set = single_set (insn);
137 if (set == NULL)
138 return NULL;
139
140 src = SET_SRC (set);
141 if (GET_CODE (src) != COMPARE)
142 return NULL;
143
144 dest = SET_DEST (set);
145 if (!REG_P (dest) || REGNO (dest) != targetm.flags_regnum)
146 return NULL;
147
148 if (REG_P (XEXP (src, 0))
149 && REG_P (XEXP (src, 0))
150 && (REG_P (XEXP (src, 1)) || CONSTANT_P (XEXP (src, 1))))
151 return src;
152
153 return NULL;
154 }
155
156 /* Look for a pattern of the "correct" form for an insn with a flags clobber
157 for which we may be able to eliminate a compare later. We're not looking
158 to validate any inputs at this time, merely see that the basic shape is
159 correct. The term "arithmetic" may be somewhat misleading... */
160
161 static bool
arithmetic_flags_clobber_p(rtx insn)162 arithmetic_flags_clobber_p (rtx insn)
163 {
164 rtx pat, x;
165
166 if (!NONJUMP_INSN_P (insn))
167 return false;
168 pat = PATTERN (insn);
169 if (extract_asm_operands (pat))
170 return false;
171
172 if (GET_CODE (pat) == PARALLEL && XVECLEN (pat, 0) == 2)
173 {
174 x = XVECEXP (pat, 0, 0);
175 if (GET_CODE (x) != SET)
176 return false;
177 x = SET_DEST (x);
178 if (!REG_P (x))
179 return false;
180
181 x = XVECEXP (pat, 0, 1);
182 if (GET_CODE (x) == CLOBBER)
183 {
184 x = XEXP (x, 0);
185 if (REG_P (x) && REGNO (x) == targetm.flags_regnum)
186 return true;
187 }
188 }
189
190 return false;
191 }
192
193 /* Look for uses of FLAGS in INSN. If we find one we can analyze, record
194 it in CMP; otherwise indicate that we've missed a use. */
195
196 static void
find_flags_uses_in_insn(struct comparison * cmp,rtx insn)197 find_flags_uses_in_insn (struct comparison *cmp, rtx insn)
198 {
199 df_ref *use_rec, use;
200
201 /* If we've already lost track of uses, don't bother collecting more. */
202 if (cmp->missing_uses)
203 return;
204
205 /* Find a USE of the flags register. */
206 for (use_rec = DF_INSN_USES (insn); (use = *use_rec) != NULL; use_rec++)
207 if (DF_REF_REGNO (use) == targetm.flags_regnum)
208 {
209 rtx x, *loc;
210
211 /* If this is an unusual use, quit. */
212 if (DF_REF_TYPE (use) != DF_REF_REG_USE)
213 goto fail;
214
215 /* If we've run out of slots to record uses, quit. */
216 if (cmp->n_uses == MAX_CMP_USE)
217 goto fail;
218
219 /* Unfortunately the location of the flags register, while present
220 in the reference structure, doesn't help. We need to find the
221 comparison code that is outer to the actual flags use. */
222 loc = DF_REF_LOC (use);
223 x = PATTERN (insn);
224 if (GET_CODE (x) == PARALLEL)
225 x = XVECEXP (x, 0, 0);
226 x = SET_SRC (x);
227 if (GET_CODE (x) == IF_THEN_ELSE)
228 x = XEXP (x, 0);
229 if (COMPARISON_P (x)
230 && loc == &XEXP (x, 0)
231 && XEXP (x, 1) == const0_rtx)
232 {
233 /* We've found a use of the flags that we understand. */
234 struct comparison_use *cuse = &cmp->uses[cmp->n_uses++];
235 cuse->insn = insn;
236 cuse->loc = loc;
237 cuse->code = GET_CODE (x);
238 }
239 else
240 goto fail;
241 }
242 return;
243
244 fail:
245 /* We failed to recognize this use of the flags register. */
246 cmp->missing_uses = true;
247 }
248
249 /* Identify comparison instructions within BB. If the flags from the last
250 compare in the BB is live at the end of the block, install the compare
251 in BB->AUX. Called via walk_dominators_tree. */
252
253 static void
find_comparisons_in_bb(struct dom_walk_data * data ATTRIBUTE_UNUSED,basic_block bb)254 find_comparisons_in_bb (struct dom_walk_data *data ATTRIBUTE_UNUSED,
255 basic_block bb)
256 {
257 struct comparison *last_cmp;
258 rtx insn, next, last_clobber;
259 bool last_cmp_valid;
260 bitmap killed;
261
262 killed = BITMAP_ALLOC (NULL);
263
264 /* The last comparison that was made. Will be reset to NULL
265 once the flags are clobbered. */
266 last_cmp = NULL;
267
268 /* True iff the last comparison has not been clobbered, nor
269 have its inputs. Used to eliminate duplicate compares. */
270 last_cmp_valid = false;
271
272 /* The last insn that clobbered the flags, if that insn is of
273 a form that may be valid for eliminating a following compare.
274 To be reset to NULL once the flags are set otherwise. */
275 last_clobber = NULL;
276
277 /* Propagate the last live comparison throughout the extended basic block. */
278 if (single_pred_p (bb))
279 {
280 last_cmp = (struct comparison *) single_pred (bb)->aux;
281 if (last_cmp)
282 last_cmp_valid = last_cmp->inputs_valid;
283 }
284
285 for (insn = BB_HEAD (bb); insn; insn = next)
286 {
287 rtx src;
288
289 next = (insn == BB_END (bb) ? NULL_RTX : NEXT_INSN (insn));
290 if (!NONDEBUG_INSN_P (insn))
291 continue;
292
293 /* Compute the set of registers modified by this instruction. */
294 bitmap_clear (killed);
295 df_simulate_find_defs (insn, killed);
296
297 src = conforming_compare (insn);
298 if (src)
299 {
300 enum machine_mode src_mode = GET_MODE (src);
301
302 /* Eliminate a compare that's redundant with the previous. */
303 if (last_cmp_valid
304 && src_mode == last_cmp->orig_mode
305 && rtx_equal_p (last_cmp->in_a, XEXP (src, 0))
306 && rtx_equal_p (last_cmp->in_b, XEXP (src, 1)))
307 {
308 delete_insn (insn);
309 continue;
310 }
311
312 last_cmp = XCNEW (struct comparison);
313 last_cmp->insn = insn;
314 last_cmp->prev_clobber = last_clobber;
315 last_cmp->in_a = XEXP (src, 0);
316 last_cmp->in_b = XEXP (src, 1);
317 last_cmp->orig_mode = src_mode;
318 VEC_safe_push (comparison_struct_p, heap, all_compares, last_cmp);
319
320 /* It's unusual, but be prepared for comparison patterns that
321 also clobber an input, or perhaps a scratch. */
322 last_clobber = NULL;
323 last_cmp_valid = true;
324 }
325
326 /* Notice if this instruction kills the flags register. */
327 else if (bitmap_bit_p (killed, targetm.flags_regnum))
328 {
329 /* See if this insn could be the "clobber" that eliminates
330 a future comparison. */
331 last_clobber = (arithmetic_flags_clobber_p (insn) ? insn : NULL);
332
333 /* In either case, the previous compare is no longer valid. */
334 last_cmp = NULL;
335 last_cmp_valid = false;
336 continue;
337 }
338
339 /* Notice if this instruction uses the flags register. */
340 else if (last_cmp)
341 find_flags_uses_in_insn (last_cmp, insn);
342
343 /* Notice if any of the inputs to the comparison have changed. */
344 if (last_cmp_valid
345 && (bitmap_bit_p (killed, REGNO (last_cmp->in_a))
346 || (REG_P (last_cmp->in_b)
347 && bitmap_bit_p (killed, REGNO (last_cmp->in_b)))))
348 last_cmp_valid = false;
349 }
350
351 BITMAP_FREE (killed);
352
353 /* Remember the live comparison for subsequent members of
354 the extended basic block. */
355 if (last_cmp)
356 {
357 bb->aux = last_cmp;
358 last_cmp->inputs_valid = last_cmp_valid;
359
360 /* Look to see if the flags register is live outgoing here, and
361 incoming to any successor not part of the extended basic block. */
362 if (bitmap_bit_p (df_get_live_out (bb), targetm.flags_regnum))
363 {
364 edge e;
365 edge_iterator ei;
366
367 FOR_EACH_EDGE (e, ei, bb->succs)
368 {
369 basic_block dest = e->dest;
370 if (bitmap_bit_p (df_get_live_in (bb),
371 targetm.flags_regnum)
372 && !single_pred_p (dest))
373 {
374 last_cmp->missing_uses = true;
375 break;
376 }
377 }
378 }
379 }
380 }
381
382 /* Find all comparisons in the function. */
383
384 static void
find_comparisons(void)385 find_comparisons (void)
386 {
387 struct dom_walk_data data;
388
389 memset (&data, 0, sizeof(data));
390 data.dom_direction = CDI_DOMINATORS;
391 data.before_dom_children = find_comparisons_in_bb;
392
393 calculate_dominance_info (CDI_DOMINATORS);
394
395 init_walk_dominator_tree (&data);
396 walk_dominator_tree (&data, ENTRY_BLOCK_PTR);
397 fini_walk_dominator_tree (&data);
398
399 clear_aux_for_blocks ();
400 free_dominance_info (CDI_DOMINATORS);
401 }
402
403 /* Select an alternate CC_MODE for a comparison insn comparing A and B.
404 Note that inputs are almost certainly different than the IN_A and IN_B
405 stored in CMP -- we're called while attempting to eliminate the compare
406 after all. Return the new FLAGS rtx if successful, else return NULL.
407 Note that this function may start a change group. */
408
409 static rtx
maybe_select_cc_mode(struct comparison * cmp,rtx a ATTRIBUTE_UNUSED,rtx b ATTRIBUTE_UNUSED)410 maybe_select_cc_mode (struct comparison *cmp, rtx a ATTRIBUTE_UNUSED,
411 rtx b ATTRIBUTE_UNUSED)
412 {
413 enum machine_mode sel_mode;
414 const int n = cmp->n_uses;
415 rtx flags = NULL;
416
417 #ifndef SELECT_CC_MODE
418 /* Minimize code differences when this target macro is undefined. */
419 return NULL;
420 #define SELECT_CC_MODE(A,B,C) (gcc_unreachable (), VOIDmode)
421 #endif
422
423 /* If we don't have access to all of the uses, we can't validate. */
424 if (cmp->missing_uses || n == 0)
425 return NULL;
426
427 /* Find a new mode that works for all of the uses. Special case the
428 common case of exactly one use. */
429 if (n == 1)
430 {
431 sel_mode = SELECT_CC_MODE (cmp->uses[0].code, a, b);
432 if (sel_mode != cmp->orig_mode)
433 {
434 flags = gen_rtx_REG (sel_mode, targetm.flags_regnum);
435 validate_change (cmp->uses[0].insn, cmp->uses[0].loc, flags, true);
436 }
437 }
438 else
439 {
440 int i;
441
442 sel_mode = SELECT_CC_MODE (cmp->uses[0].code, a, b);
443 for (i = 1; i < n; ++i)
444 {
445 enum machine_mode new_mode;
446 new_mode = SELECT_CC_MODE (cmp->uses[i].code, a, b);
447 if (new_mode != sel_mode)
448 {
449 sel_mode = targetm.cc_modes_compatible (sel_mode, new_mode);
450 if (sel_mode == VOIDmode)
451 return NULL;
452 }
453 }
454
455 if (sel_mode != cmp->orig_mode)
456 {
457 flags = gen_rtx_REG (sel_mode, targetm.flags_regnum);
458 for (i = 0; i < n; ++i)
459 validate_change (cmp->uses[i].insn, cmp->uses[i].loc, flags, true);
460 }
461 }
462
463 return flags;
464 }
465
466 /* Attempt to replace a comparison with a prior arithmetic insn that can
467 compute the same flags value as the comparison itself. Return true if
468 successful, having made all rtl modifications necessary. */
469
470 static bool
try_eliminate_compare(struct comparison * cmp)471 try_eliminate_compare (struct comparison *cmp)
472 {
473 rtx x, insn, bb_head, flags, in_a, cmp_src;
474
475 /* We must have found an interesting "clobber" preceeding the compare. */
476 if (cmp->prev_clobber == NULL)
477 return false;
478
479 /* ??? For the moment we don't handle comparisons for which IN_B
480 is a register. We accepted these during initial comparison
481 recognition in order to eliminate duplicate compares.
482 An improvement here would be to handle x = a - b; if (a cmp b). */
483 if (!CONSTANT_P (cmp->in_b))
484 return false;
485
486 /* Verify that IN_A is not clobbered in between CMP and PREV_CLOBBER.
487 Given that this target requires this pass, we can assume that most
488 insns do clobber the flags, and so the distance between the compare
489 and the clobber is likely to be small. */
490 /* ??? This is one point at which one could argue that DF_REF_CHAIN would
491 be useful, but it is thought to be too heavy-weight a solution here. */
492
493 in_a = cmp->in_a;
494 insn = cmp->insn;
495 bb_head = BB_HEAD (BLOCK_FOR_INSN (insn));
496 for (insn = PREV_INSN (insn);
497 insn != cmp->prev_clobber;
498 insn = PREV_INSN (insn))
499 {
500 const int abnormal_flags
501 = (DF_REF_CONDITIONAL | DF_REF_PARTIAL | DF_REF_MAY_CLOBBER
502 | DF_REF_MUST_CLOBBER | DF_REF_SIGN_EXTRACT
503 | DF_REF_ZERO_EXTRACT | DF_REF_STRICT_LOW_PART
504 | DF_REF_PRE_POST_MODIFY);
505 df_ref *def_rec, def;
506
507 /* Note that the BB_HEAD is always either a note or a label, but in
508 any case it means that IN_A is defined outside the block. */
509 if (insn == bb_head)
510 return false;
511 if (NOTE_P (insn) || DEBUG_INSN_P (insn))
512 continue;
513
514 /* Find a possible def of IN_A in INSN. */
515 for (def_rec = DF_INSN_DEFS (insn); (def = *def_rec) != NULL; def_rec++)
516 if (DF_REF_REGNO (def) == REGNO (in_a))
517 break;
518
519 /* No definitions of IN_A; continue searching. */
520 if (def == NULL)
521 continue;
522
523 /* Bail if this is not a totally normal set of IN_A. */
524 if (DF_REF_IS_ARTIFICIAL (def))
525 return false;
526 if (DF_REF_FLAGS (def) & abnormal_flags)
527 return false;
528
529 /* We've found an insn between the compare and the clobber that sets
530 IN_A. Given that pass_cprop_hardreg has not yet run, we still find
531 situations in which we can usefully look through a copy insn. */
532 x = single_set (insn);
533 if (x == NULL)
534 return false;
535 in_a = SET_SRC (x);
536 if (!REG_P (in_a))
537 return false;
538 }
539
540 /* We've reached PREV_CLOBBER without finding a modification of IN_A.
541 Validate that PREV_CLOBBER itself does in fact refer to IN_A. Do
542 recall that we've already validated the shape of PREV_CLOBBER. */
543 x = XVECEXP (PATTERN (insn), 0, 0);
544 if (!rtx_equal_p (SET_DEST (x), in_a))
545 return false;
546 cmp_src = SET_SRC (x);
547
548 /* Determine if we ought to use a different CC_MODE here. */
549 flags = maybe_select_cc_mode (cmp, cmp_src, cmp->in_b);
550 if (flags == NULL)
551 flags = gen_rtx_REG (cmp->orig_mode, targetm.flags_regnum);
552
553 /* Generate a new comparison for installation in the setter. */
554 x = copy_rtx (cmp_src);
555 x = gen_rtx_COMPARE (GET_MODE (flags), x, cmp->in_b);
556 x = gen_rtx_SET (VOIDmode, flags, x);
557
558 /* Succeed if the new instruction is valid. Note that we may have started
559 a change group within maybe_select_cc_mode, therefore we must continue. */
560 validate_change (insn, &XVECEXP (PATTERN (insn), 0, 1), x, true);
561 if (!apply_change_group ())
562 return false;
563
564 /* Success. Delete the compare insn... */
565 delete_insn (cmp->insn);
566
567 /* ... and any notes that are now invalid due to multiple sets. */
568 x = find_regno_note (insn, REG_UNUSED, targetm.flags_regnum);
569 if (x)
570 remove_note (insn, x);
571 x = find_reg_note (insn, REG_EQUAL, NULL);
572 if (x)
573 remove_note (insn, x);
574 x = find_reg_note (insn, REG_EQUIV, NULL);
575 if (x)
576 remove_note (insn, x);
577
578 return true;
579 }
580
581 /* Main entry point to the pass. */
582
583 static unsigned int
execute_compare_elim_after_reload(void)584 execute_compare_elim_after_reload (void)
585 {
586 df_analyze ();
587
588 gcc_checking_assert (all_compares == NULL);
589
590 /* Locate all comparisons and their uses, and eliminate duplicates. */
591 find_comparisons ();
592 if (all_compares)
593 {
594 struct comparison *cmp;
595 size_t i;
596
597 /* Eliminate comparisons that are redundant with flags computation. */
598 FOR_EACH_VEC_ELT (comparison_struct_p, all_compares, i, cmp)
599 {
600 try_eliminate_compare (cmp);
601 XDELETE (cmp);
602 }
603
604 VEC_free (comparison_struct_p, heap, all_compares);
605 all_compares = NULL;
606 }
607
608 return 0;
609 }
610
611 static bool
gate_compare_elim_after_reload(void)612 gate_compare_elim_after_reload (void)
613 {
614 /* Setting this target hook value is how a backend indicates the need. */
615 if (targetm.flags_regnum == INVALID_REGNUM)
616 return false;
617 return flag_compare_elim_after_reload;
618 }
619
620 struct rtl_opt_pass pass_compare_elim_after_reload =
621 {
622 {
623 RTL_PASS,
624 "cmpelim", /* name */
625 gate_compare_elim_after_reload, /* gate */
626 execute_compare_elim_after_reload, /* execute */
627 NULL, /* sub */
628 NULL, /* next */
629 0, /* static_pass_number */
630 TV_NONE, /* tv_id */
631 0, /* properties_required */
632 0, /* properties_provided */
633 0, /* properties_destroyed */
634 0, /* todo_flags_start */
635 TODO_df_finish
636 | TODO_df_verify
637 | TODO_verify_rtl_sharing
638 | TODO_ggc_collect /* todo_flags_finish */
639 }
640 };
641