/* Loop header copying on trees.
   Copyright (C) 2004, 2005, 2006, 2007, 2008, 2010
   Free Software Foundation, Inc.

This file is part of GCC.

GCC is free software; you can redistribute it and/or modify it
under the terms of the GNU General Public License as published by the
Free Software Foundation; either version 3, or (at your option) any
later version.

GCC is distributed in the hope that it will be useful, but WITHOUT
ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
for more details.

You should have received a copy of the GNU General Public License
along with GCC; see the file COPYING3.  If not see
<http://www.gnu.org/licenses/>.  */
20*e4b17023SJohn Marino
21*e4b17023SJohn Marino #include "config.h"
22*e4b17023SJohn Marino #include "system.h"
23*e4b17023SJohn Marino #include "coretypes.h"
24*e4b17023SJohn Marino #include "tm.h"
25*e4b17023SJohn Marino #include "tree.h"
26*e4b17023SJohn Marino #include "tm_p.h"
27*e4b17023SJohn Marino #include "basic-block.h"
28*e4b17023SJohn Marino #include "output.h"
29*e4b17023SJohn Marino #include "tree-flow.h"
30*e4b17023SJohn Marino #include "tree-dump.h"
31*e4b17023SJohn Marino #include "tree-pass.h"
32*e4b17023SJohn Marino #include "timevar.h"
33*e4b17023SJohn Marino #include "cfgloop.h"
34*e4b17023SJohn Marino #include "tree-inline.h"
35*e4b17023SJohn Marino #include "flags.h"
36*e4b17023SJohn Marino #include "tree-inline.h"
37*e4b17023SJohn Marino
/* Duplicates headers of loops if they are small enough, so that the statements
   in the loop body are always executed when the loop is entered.  This
   increases effectiveness of code motion optimizations, and reduces the need
   for loop preconditioning.  */
42*e4b17023SJohn Marino
43*e4b17023SJohn Marino /* Check whether we should duplicate HEADER of LOOP. At most *LIMIT
44*e4b17023SJohn Marino instructions should be duplicated, limit is decreased by the actual
45*e4b17023SJohn Marino amount. */
46*e4b17023SJohn Marino
47*e4b17023SJohn Marino static bool
should_duplicate_loop_header_p(basic_block header,struct loop * loop,int * limit)48*e4b17023SJohn Marino should_duplicate_loop_header_p (basic_block header, struct loop *loop,
49*e4b17023SJohn Marino int *limit)
50*e4b17023SJohn Marino {
51*e4b17023SJohn Marino gimple_stmt_iterator bsi;
52*e4b17023SJohn Marino gimple last;
53*e4b17023SJohn Marino
54*e4b17023SJohn Marino /* Do not copy one block more than once (we do not really want to do
55*e4b17023SJohn Marino loop peeling here). */
56*e4b17023SJohn Marino if (header->aux)
57*e4b17023SJohn Marino return false;
58*e4b17023SJohn Marino
59*e4b17023SJohn Marino /* Loop header copying usually increases size of the code. This used not to
60*e4b17023SJohn Marino be true, since quite often it is possible to verify that the condition is
61*e4b17023SJohn Marino satisfied in the first iteration and therefore to eliminate it. Jump
62*e4b17023SJohn Marino threading handles these cases now. */
63*e4b17023SJohn Marino if (optimize_loop_for_size_p (loop))
64*e4b17023SJohn Marino return false;
65*e4b17023SJohn Marino
66*e4b17023SJohn Marino gcc_assert (EDGE_COUNT (header->succs) > 0);
67*e4b17023SJohn Marino if (single_succ_p (header))
68*e4b17023SJohn Marino return false;
69*e4b17023SJohn Marino if (flow_bb_inside_loop_p (loop, EDGE_SUCC (header, 0)->dest)
70*e4b17023SJohn Marino && flow_bb_inside_loop_p (loop, EDGE_SUCC (header, 1)->dest))
71*e4b17023SJohn Marino return false;
72*e4b17023SJohn Marino
73*e4b17023SJohn Marino /* If this is not the original loop header, we want it to have just
74*e4b17023SJohn Marino one predecessor in order to match the && pattern. */
75*e4b17023SJohn Marino if (header != loop->header && !single_pred_p (header))
76*e4b17023SJohn Marino return false;
77*e4b17023SJohn Marino
78*e4b17023SJohn Marino last = last_stmt (header);
79*e4b17023SJohn Marino if (gimple_code (last) != GIMPLE_COND)
80*e4b17023SJohn Marino return false;
81*e4b17023SJohn Marino
82*e4b17023SJohn Marino /* Approximately copy the conditions that used to be used in jump.c --
83*e4b17023SJohn Marino at most 20 insns and no calls. */
84*e4b17023SJohn Marino for (bsi = gsi_start_bb (header); !gsi_end_p (bsi); gsi_next (&bsi))
85*e4b17023SJohn Marino {
86*e4b17023SJohn Marino last = gsi_stmt (bsi);
87*e4b17023SJohn Marino
88*e4b17023SJohn Marino if (gimple_code (last) == GIMPLE_LABEL)
89*e4b17023SJohn Marino continue;
90*e4b17023SJohn Marino
91*e4b17023SJohn Marino if (is_gimple_debug (last))
92*e4b17023SJohn Marino continue;
93*e4b17023SJohn Marino
94*e4b17023SJohn Marino if (is_gimple_call (last))
95*e4b17023SJohn Marino return false;
96*e4b17023SJohn Marino
97*e4b17023SJohn Marino *limit -= estimate_num_insns (last, &eni_size_weights);
98*e4b17023SJohn Marino if (*limit < 0)
99*e4b17023SJohn Marino return false;
100*e4b17023SJohn Marino }
101*e4b17023SJohn Marino
102*e4b17023SJohn Marino return true;
103*e4b17023SJohn Marino }
104*e4b17023SJohn Marino
105*e4b17023SJohn Marino /* Checks whether LOOP is a do-while style loop. */
106*e4b17023SJohn Marino
107*e4b17023SJohn Marino bool
do_while_loop_p(struct loop * loop)108*e4b17023SJohn Marino do_while_loop_p (struct loop *loop)
109*e4b17023SJohn Marino {
110*e4b17023SJohn Marino gimple stmt = last_stmt (loop->latch);
111*e4b17023SJohn Marino
112*e4b17023SJohn Marino /* If the latch of the loop is not empty, it is not a do-while loop. */
113*e4b17023SJohn Marino if (stmt
114*e4b17023SJohn Marino && gimple_code (stmt) != GIMPLE_LABEL)
115*e4b17023SJohn Marino return false;
116*e4b17023SJohn Marino
117*e4b17023SJohn Marino /* If the header contains just a condition, it is not a do-while loop. */
118*e4b17023SJohn Marino stmt = last_and_only_stmt (loop->header);
119*e4b17023SJohn Marino if (stmt
120*e4b17023SJohn Marino && gimple_code (stmt) == GIMPLE_COND)
121*e4b17023SJohn Marino return false;
122*e4b17023SJohn Marino
123*e4b17023SJohn Marino return true;
124*e4b17023SJohn Marino }
125*e4b17023SJohn Marino
126*e4b17023SJohn Marino /* For all loops, copy the condition at the end of the loop body in front
127*e4b17023SJohn Marino of the loop. This is beneficial since it increases efficiency of
128*e4b17023SJohn Marino code motion optimizations. It also saves one jump on entry to the loop. */
129*e4b17023SJohn Marino
130*e4b17023SJohn Marino static unsigned int
copy_loop_headers(void)131*e4b17023SJohn Marino copy_loop_headers (void)
132*e4b17023SJohn Marino {
133*e4b17023SJohn Marino loop_iterator li;
134*e4b17023SJohn Marino struct loop *loop;
135*e4b17023SJohn Marino basic_block header;
136*e4b17023SJohn Marino edge exit, entry;
137*e4b17023SJohn Marino basic_block *bbs, *copied_bbs;
138*e4b17023SJohn Marino unsigned n_bbs;
139*e4b17023SJohn Marino unsigned bbs_size;
140*e4b17023SJohn Marino
141*e4b17023SJohn Marino loop_optimizer_init (LOOPS_HAVE_PREHEADERS
142*e4b17023SJohn Marino | LOOPS_HAVE_SIMPLE_LATCHES);
143*e4b17023SJohn Marino if (number_of_loops () <= 1)
144*e4b17023SJohn Marino {
145*e4b17023SJohn Marino loop_optimizer_finalize ();
146*e4b17023SJohn Marino return 0;
147*e4b17023SJohn Marino }
148*e4b17023SJohn Marino
149*e4b17023SJohn Marino #ifdef ENABLE_CHECKING
150*e4b17023SJohn Marino verify_loop_structure ();
151*e4b17023SJohn Marino #endif
152*e4b17023SJohn Marino
153*e4b17023SJohn Marino bbs = XNEWVEC (basic_block, n_basic_blocks);
154*e4b17023SJohn Marino copied_bbs = XNEWVEC (basic_block, n_basic_blocks);
155*e4b17023SJohn Marino bbs_size = n_basic_blocks;
156*e4b17023SJohn Marino
157*e4b17023SJohn Marino FOR_EACH_LOOP (li, loop, 0)
158*e4b17023SJohn Marino {
159*e4b17023SJohn Marino /* Copy at most 20 insns. */
160*e4b17023SJohn Marino int limit = 20;
161*e4b17023SJohn Marino
162*e4b17023SJohn Marino header = loop->header;
163*e4b17023SJohn Marino
164*e4b17023SJohn Marino /* If the loop is already a do-while style one (either because it was
165*e4b17023SJohn Marino written as such, or because jump threading transformed it into one),
166*e4b17023SJohn Marino we might be in fact peeling the first iteration of the loop. This
167*e4b17023SJohn Marino in general is not a good idea. */
168*e4b17023SJohn Marino if (do_while_loop_p (loop))
169*e4b17023SJohn Marino continue;
170*e4b17023SJohn Marino
171*e4b17023SJohn Marino /* Iterate the header copying up to limit; this takes care of the cases
172*e4b17023SJohn Marino like while (a && b) {...}, where we want to have both of the conditions
173*e4b17023SJohn Marino copied. TODO -- handle while (a || b) - like cases, by not requiring
174*e4b17023SJohn Marino the header to have just a single successor and copying up to
175*e4b17023SJohn Marino postdominator. */
176*e4b17023SJohn Marino
177*e4b17023SJohn Marino exit = NULL;
178*e4b17023SJohn Marino n_bbs = 0;
179*e4b17023SJohn Marino while (should_duplicate_loop_header_p (header, loop, &limit))
180*e4b17023SJohn Marino {
181*e4b17023SJohn Marino /* Find a successor of header that is inside a loop; i.e. the new
182*e4b17023SJohn Marino header after the condition is copied. */
183*e4b17023SJohn Marino if (flow_bb_inside_loop_p (loop, EDGE_SUCC (header, 0)->dest))
184*e4b17023SJohn Marino exit = EDGE_SUCC (header, 0);
185*e4b17023SJohn Marino else
186*e4b17023SJohn Marino exit = EDGE_SUCC (header, 1);
187*e4b17023SJohn Marino bbs[n_bbs++] = header;
188*e4b17023SJohn Marino gcc_assert (bbs_size > n_bbs);
189*e4b17023SJohn Marino header = exit->dest;
190*e4b17023SJohn Marino }
191*e4b17023SJohn Marino
192*e4b17023SJohn Marino if (!exit)
193*e4b17023SJohn Marino continue;
194*e4b17023SJohn Marino
195*e4b17023SJohn Marino if (dump_file && (dump_flags & TDF_DETAILS))
196*e4b17023SJohn Marino fprintf (dump_file,
197*e4b17023SJohn Marino "Duplicating header of the loop %d up to edge %d->%d.\n",
198*e4b17023SJohn Marino loop->num, exit->src->index, exit->dest->index);
199*e4b17023SJohn Marino
200*e4b17023SJohn Marino /* Ensure that the header will have just the latch as a predecessor
201*e4b17023SJohn Marino inside the loop. */
202*e4b17023SJohn Marino if (!single_pred_p (exit->dest))
203*e4b17023SJohn Marino exit = single_pred_edge (split_edge (exit));
204*e4b17023SJohn Marino
205*e4b17023SJohn Marino entry = loop_preheader_edge (loop);
206*e4b17023SJohn Marino
207*e4b17023SJohn Marino if (!gimple_duplicate_sese_region (entry, exit, bbs, n_bbs, copied_bbs))
208*e4b17023SJohn Marino {
209*e4b17023SJohn Marino fprintf (dump_file, "Duplication failed.\n");
210*e4b17023SJohn Marino continue;
211*e4b17023SJohn Marino }
212*e4b17023SJohn Marino
213*e4b17023SJohn Marino /* If the loop has the form "for (i = j; i < j + 10; i++)" then
214*e4b17023SJohn Marino this copying can introduce a case where we rely on undefined
215*e4b17023SJohn Marino signed overflow to eliminate the preheader condition, because
216*e4b17023SJohn Marino we assume that "j < j + 10" is true. We don't want to warn
217*e4b17023SJohn Marino about that case for -Wstrict-overflow, because in general we
218*e4b17023SJohn Marino don't warn about overflow involving loops. Prevent the
219*e4b17023SJohn Marino warning by setting the no_warning flag in the condition. */
220*e4b17023SJohn Marino if (warn_strict_overflow > 0)
221*e4b17023SJohn Marino {
222*e4b17023SJohn Marino unsigned int i;
223*e4b17023SJohn Marino
224*e4b17023SJohn Marino for (i = 0; i < n_bbs; ++i)
225*e4b17023SJohn Marino {
226*e4b17023SJohn Marino gimple_stmt_iterator bsi;
227*e4b17023SJohn Marino
228*e4b17023SJohn Marino for (bsi = gsi_start_bb (copied_bbs[i]);
229*e4b17023SJohn Marino !gsi_end_p (bsi);
230*e4b17023SJohn Marino gsi_next (&bsi))
231*e4b17023SJohn Marino {
232*e4b17023SJohn Marino gimple stmt = gsi_stmt (bsi);
233*e4b17023SJohn Marino if (gimple_code (stmt) == GIMPLE_COND)
234*e4b17023SJohn Marino gimple_set_no_warning (stmt, true);
235*e4b17023SJohn Marino else if (is_gimple_assign (stmt))
236*e4b17023SJohn Marino {
237*e4b17023SJohn Marino enum tree_code rhs_code = gimple_assign_rhs_code (stmt);
238*e4b17023SJohn Marino if (TREE_CODE_CLASS (rhs_code) == tcc_comparison)
239*e4b17023SJohn Marino gimple_set_no_warning (stmt, true);
240*e4b17023SJohn Marino }
241*e4b17023SJohn Marino }
242*e4b17023SJohn Marino }
243*e4b17023SJohn Marino }
244*e4b17023SJohn Marino
245*e4b17023SJohn Marino /* Ensure that the latch and the preheader is simple (we know that they
246*e4b17023SJohn Marino are not now, since there was the loop exit condition. */
247*e4b17023SJohn Marino split_edge (loop_preheader_edge (loop));
248*e4b17023SJohn Marino split_edge (loop_latch_edge (loop));
249*e4b17023SJohn Marino }
250*e4b17023SJohn Marino
251*e4b17023SJohn Marino free (bbs);
252*e4b17023SJohn Marino free (copied_bbs);
253*e4b17023SJohn Marino
254*e4b17023SJohn Marino loop_optimizer_finalize ();
255*e4b17023SJohn Marino return 0;
256*e4b17023SJohn Marino }
257*e4b17023SJohn Marino
258*e4b17023SJohn Marino static bool
gate_ch(void)259*e4b17023SJohn Marino gate_ch (void)
260*e4b17023SJohn Marino {
261*e4b17023SJohn Marino return flag_tree_ch != 0;
262*e4b17023SJohn Marino }
263*e4b17023SJohn Marino
264*e4b17023SJohn Marino struct gimple_opt_pass pass_ch =
265*e4b17023SJohn Marino {
266*e4b17023SJohn Marino {
267*e4b17023SJohn Marino GIMPLE_PASS,
268*e4b17023SJohn Marino "ch", /* name */
269*e4b17023SJohn Marino gate_ch, /* gate */
270*e4b17023SJohn Marino copy_loop_headers, /* execute */
271*e4b17023SJohn Marino NULL, /* sub */
272*e4b17023SJohn Marino NULL, /* next */
273*e4b17023SJohn Marino 0, /* static_pass_number */
274*e4b17023SJohn Marino TV_TREE_CH, /* tv_id */
275*e4b17023SJohn Marino PROP_cfg | PROP_ssa, /* properties_required */
276*e4b17023SJohn Marino 0, /* properties_provided */
277*e4b17023SJohn Marino 0, /* properties_destroyed */
278*e4b17023SJohn Marino 0, /* todo_flags_start */
279*e4b17023SJohn Marino TODO_cleanup_cfg
280*e4b17023SJohn Marino | TODO_verify_ssa
281*e4b17023SJohn Marino | TODO_verify_flow /* todo_flags_finish */
282*e4b17023SJohn Marino }
283*e4b17023SJohn Marino };
284