xref: /netbsd-src/external/gpl3/gcc/dist/gcc/graphite.cc (revision b1e838363e3c6fc78a55519254d99869742dd33c)
1 /* Gimple Represented as Polyhedra.
2    Copyright (C) 2006-2022 Free Software Foundation, Inc.
3    Contributed by Sebastian Pop <sebastian.pop@inria.fr>.
4 
5 This file is part of GCC.
6 
7 GCC is free software; you can redistribute it and/or modify
8 it under the terms of the GNU General Public License as published by
9 the Free Software Foundation; either version 3, or (at your option)
10 any later version.
11 
12 GCC is distributed in the hope that it will be useful,
13 but WITHOUT ANY WARRANTY; without even the implied warranty of
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
15 GNU General Public License for more details.
16 
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING3.  If not see
19 <http://www.gnu.org/licenses/>.  */
20 
21 /* This pass converts GIMPLE to GRAPHITE, performs some loop
22    transformations and then converts the resulting representation back
23    to GIMPLE.
24 
25    An early description of this pass can be found in the GCC Summit'06
26    paper "GRAPHITE: Polyhedral Analyses and Optimizations for GCC".
27    The wiki page http://gcc.gnu.org/wiki/Graphite contains pointers to
28    the related work.  */
29 
30 #define INCLUDE_ISL
31 
32 #include "config.h"
33 #include "system.h"
34 #include "coretypes.h"
35 #include "backend.h"
36 #include "diagnostic-core.h"
37 #include "cfgloop.h"
38 #include "tree-pass.h"
39 #include "pretty-print.h"
40 #include "cfganal.h"
41 
42 #ifdef HAVE_isl
43 #include "cfghooks.h"
44 #include "tree.h"
45 #include "gimple.h"
46 #include "ssa.h"
47 #include "fold-const.h"
48 #include "gimple-iterator.h"
49 #include "tree-cfg.h"
50 #include "tree-ssa-loop.h"
51 #include "tree-data-ref.h"
52 #include "tree-scalar-evolution.h"
53 #include "dbgcnt.h"
54 #include "tree-parloops.h"
55 #include "tree-cfgcleanup.h"
56 #include "tree-vectorizer.h"
57 #include "tree-ssa-loop-manip.h"
58 #include "tree-ssa.h"
59 #include "tree-into-ssa.h"
60 #include "graphite.h"
61 
62 /* Print global statistics to FILE.  */
63 
64 static void
print_global_statistics(FILE * file)65 print_global_statistics (FILE* file)
66 {
67   long n_bbs = 0;
68   long n_loops = 0;
69   long n_stmts = 0;
70   long n_conditions = 0;
71   profile_count n_p_bbs = profile_count::zero ();
72   profile_count n_p_loops = profile_count::zero ();
73   profile_count n_p_stmts = profile_count::zero ();
74   profile_count n_p_conditions = profile_count::zero ();
75 
76   basic_block bb;
77 
78   FOR_ALL_BB_FN (bb, cfun)
79     {
80       gimple_stmt_iterator psi;
81 
82       n_bbs++;
83       if (bb->count.initialized_p ())
84         n_p_bbs += bb->count;
85 
86       /* Ignore artificial surrounding loop.  */
87       if (bb == bb->loop_father->header
88 	  && bb->index != 0)
89 	{
90 	  n_loops++;
91 	  n_p_loops += bb->count;
92 	}
93 
94       if (EDGE_COUNT (bb->succs) > 1)
95 	{
96 	  n_conditions++;
97 	  if (bb->count.initialized_p ())
98 	    n_p_conditions += bb->count;
99 	}
100 
101       for (psi = gsi_start_bb (bb); !gsi_end_p (psi); gsi_next (&psi))
102 	{
103 	  n_stmts++;
104 	  if (bb->count.initialized_p ())
105 	    n_p_stmts += bb->count;
106 	}
107     }
108 
109   fprintf (file, "\nGlobal statistics (");
110   fprintf (file, "BBS:%ld, ", n_bbs);
111   fprintf (file, "LOOPS:%ld, ", n_loops);
112   fprintf (file, "CONDITIONS:%ld, ", n_conditions);
113   fprintf (file, "STMTS:%ld)\n", n_stmts);
114   fprintf (file, "Global profiling statistics (");
115   fprintf (file, "BBS:");
116   n_p_bbs.dump (file);
117   fprintf (file, ", LOOPS:");
118   n_p_loops.dump (file);
119   fprintf (file, ", CONDITIONS:");
120   n_p_conditions.dump (file);
121   fprintf (file, ", STMTS:");
122   n_p_stmts.dump (file);
123   fprintf (file, ")\n\n");
124 }
125 
126 /* Print statistics for SCOP to FILE.  */
127 
128 static void
print_graphite_scop_statistics(FILE * file,scop_p scop)129 print_graphite_scop_statistics (FILE* file, scop_p scop)
130 {
131   long n_bbs = 0;
132   long n_loops = 0;
133   long n_stmts = 0;
134   long n_conditions = 0;
135   profile_count n_p_bbs = profile_count::zero ();
136   profile_count n_p_loops = profile_count::zero ();
137   profile_count n_p_stmts = profile_count::zero ();
138   profile_count n_p_conditions = profile_count::zero ();
139 
140   basic_block bb;
141 
142   FOR_ALL_BB_FN (bb, cfun)
143     {
144       gimple_stmt_iterator psi;
145       loop_p loop = bb->loop_father;
146 
147       if (!bb_in_sese_p (bb, scop->scop_info->region))
148 	continue;
149 
150       n_bbs++;
151       if (bb->count.initialized_p ())
152         n_p_bbs += bb->count;
153 
154       if (EDGE_COUNT (bb->succs) > 1)
155 	{
156 	  n_conditions++;
157 	  n_p_conditions += bb->count;
158 	}
159 
160       for (psi = gsi_start_bb (bb); !gsi_end_p (psi); gsi_next (&psi))
161 	{
162 	  n_stmts++;
163 	  n_p_stmts += bb->count;
164 	}
165 
166       if (loop->header == bb && loop_in_sese_p (loop, scop->scop_info->region))
167 	{
168 	  n_loops++;
169 	  n_p_loops += bb->count;
170 	}
171     }
172 
173   fprintf (file, "\nFunction Name: %s\n", current_function_name ());
174 
175   edge scop_begin = scop->scop_info->region.entry;
176   edge scop_end = scop->scop_info->region.exit;
177 
178   fprintf (file, "\nSCoP (entry_edge (bb_%d, bb_%d), ",
179 	   scop_begin->src->index, scop_begin->dest->index);
180   fprintf (file, "exit_edge (bb_%d, bb_%d))",
181 	   scop_end->src->index, scop_end->dest->index);
182 
183   fprintf (file, "\nSCoP statistics (");
184   fprintf (file, "BBS:%ld, ", n_bbs);
185   fprintf (file, "LOOPS:%ld, ", n_loops);
186   fprintf (file, "CONDITIONS:%ld, ", n_conditions);
187   fprintf (file, "STMTS:%ld)\n", n_stmts);
188   fprintf (file, "SCoP profiling statistics (");
189   fprintf (file, "BBS:");
190   n_p_bbs.dump (file);
191   fprintf (file, ", LOOPS:");
192   n_p_loops.dump (file);
193   fprintf (file, ", CONDITIONS:");
194   n_p_conditions.dump (file);
195   fprintf (file, ", STMTS:");
196   n_p_stmts.dump (file);
197   fprintf (file, ")\n\n");
198 }
199 
200 /* Print statistics for SCOPS to FILE.  */
201 
202 static void
print_graphite_statistics(FILE * file,vec<scop_p> scops)203 print_graphite_statistics (FILE* file, vec<scop_p> scops)
204 {
205   int i;
206   scop_p scop;
207 
208   FOR_EACH_VEC_ELT (scops, i, scop)
209     print_graphite_scop_statistics (file, scop);
210 }
211 
212 struct seir_cache_key
213 {
214   hashval_t hash;
215   int entry_dest;
216   int exit_src;
217   int loop_num;
218   tree expr;
219 };
220 
221 struct sese_scev_hash : typed_noop_remove <seir_cache_key>
222 {
223   typedef seir_cache_key value_type;
224   typedef seir_cache_key compare_type;
hashsese_scev_hash225   static hashval_t hash (const seir_cache_key &key) { return key.hash; }
226   static bool
equalsese_scev_hash227   equal (const seir_cache_key &key1, const seir_cache_key &key2)
228   {
229     return (key1.hash == key2.hash
230 	    && key1.entry_dest == key2.entry_dest
231 	    && key1.exit_src == key2.exit_src
232 	    && key1.loop_num == key2.loop_num
233 	    && operand_equal_p (key1.expr, key2.expr, 0));
234   }
mark_deletedsese_scev_hash235   static void mark_deleted (seir_cache_key &key) { key.expr = NULL_TREE; }
236   static const bool empty_zero_p = false;
mark_emptysese_scev_hash237   static void mark_empty (seir_cache_key &key) { key.entry_dest = 0; }
is_deletedsese_scev_hash238   static bool is_deleted (const seir_cache_key &key) { return !key.expr; }
is_emptysese_scev_hash239   static bool is_empty (const seir_cache_key &key) { return key.entry_dest == 0; }
240 };
241 
242 static hash_map<sese_scev_hash, tree> *seir_cache;
243 
244 /* Same as scalar_evolution_in_region but caches results so we avoid
245    re-computing evolutions during transform phase.  */
246 
247 tree
cached_scalar_evolution_in_region(const sese_l & region,loop_p loop,tree expr)248 cached_scalar_evolution_in_region (const sese_l &region, loop_p loop,
249 				   tree expr)
250 {
251   seir_cache_key key;
252   key.entry_dest = region.entry->dest->index;
253   key.exit_src = region.exit->src->index;
254   key.loop_num = loop->num;
255   key.expr = expr;
256   inchash::hash hstate (0);
257   hstate.add_int (key.entry_dest);
258   hstate.add_int (key.exit_src);
259   hstate.add_int (key.loop_num);
260   inchash::add_expr (key.expr, hstate);
261   key.hash = hstate.end ();
262 
263   bool existed;
264   tree &chrec = seir_cache->get_or_insert (key, &existed);
265   if (!existed)
266     chrec = scalar_evolution_in_region (region, loop, expr);
267   return chrec;
268 }
269 
270 /* Deletes all scops in SCOPS.  */
271 
272 static void
free_scops(vec<scop_p> scops)273 free_scops (vec<scop_p> scops)
274 {
275   int i;
276   scop_p scop;
277 
278   FOR_EACH_VEC_ELT (scops, i, scop)
279     free_scop (scop);
280 
281   scops.release ();
282 }
283 
284 /* Transforms LOOP to the canonical loop closed SSA form.  */
285 
286 static void
canonicalize_loop_closed_ssa(loop_p loop,edge e)287 canonicalize_loop_closed_ssa (loop_p loop, edge e)
288 {
289   basic_block bb;
290   gphi_iterator psi;
291 
292   bb = e->dest;
293 
294   /* Make the loop-close PHI node BB contain only PHIs and have a
295      single predecessor.  */
296   if (single_pred_p (bb))
297     {
298       e = split_block_after_labels (bb);
299       bb = e->src;
300     }
301   else
302     {
303       basic_block close = split_edge (e);
304       e = single_succ_edge (close);
305       for (psi = gsi_start_phis (bb); !gsi_end_p (psi); gsi_next (&psi))
306 	{
307 	  gphi *phi = psi.phi ();
308 	  use_operand_p use_p = PHI_ARG_DEF_PTR_FROM_EDGE (phi, e);
309 	  tree arg = USE_FROM_PTR (use_p);
310 
311 	  /* Only add close phi nodes for SSA_NAMEs defined in LOOP.  */
312 	  if (TREE_CODE (arg) != SSA_NAME
313 	      || SSA_NAME_IS_DEFAULT_DEF (arg)
314 	      || ! flow_bb_inside_loop_p (loop,
315 					  gimple_bb (SSA_NAME_DEF_STMT (arg))))
316 	    continue;
317 
318 	  tree res = copy_ssa_name (arg);
319 	  gphi *close_phi = create_phi_node (res, close);
320 	  add_phi_arg (close_phi, arg, gimple_phi_arg_edge (close_phi, 0),
321 		       UNKNOWN_LOCATION);
322 	  SET_USE (use_p, res);
323 	}
324       bb = close;
325     }
326 
327   /* Eliminate duplicates.  This relies on processing loops from
328      innermost to outer.  */
329   for (psi = gsi_start_phis (bb); !gsi_end_p (psi); gsi_next (&psi))
330     {
331       gphi_iterator gsi = psi;
332       gphi *phi = psi.phi ();
333 
334       /* At this point, PHI should be a close phi in normal form.  */
335       gcc_assert (gimple_phi_num_args (phi) == 1);
336 
337       /* Iterate over the next phis and remove duplicates.  */
338       gsi_next (&gsi);
339       while (!gsi_end_p (gsi))
340 	if (gimple_phi_arg_def (phi, 0) == gimple_phi_arg_def (gsi.phi (), 0))
341 	  {
342 	    replace_uses_by (gimple_phi_result (gsi.phi ()),
343 			     gimple_phi_result (phi));
344 	    remove_phi_node (&gsi, true);
345 	  }
346 	else
347 	  gsi_next (&gsi);
348     }
349 }
350 
351 /* Converts the current loop closed SSA form to a canonical form
352    expected by the Graphite code generation.
353 
354    The loop closed SSA form has the following invariant: a variable
355    defined in a loop that is used outside the loop appears only in the
356    phi nodes in the destination of the loop exit.  These phi nodes are
357    called close phi nodes.
358 
359    The canonical loop closed SSA form contains the extra invariants:
360 
361    - when the loop contains only one exit, the close phi nodes contain
362    only one argument.  That implies that the basic block that contains
363    the close phi nodes has only one predecessor, that is a basic block
364    in the loop.
365 
366    - the basic block containing the close phi nodes does not contain
367    other statements.
368 
369    - there exist only one phi node per definition in the loop.
370 
371    In addition to that we also make sure that loop exit edges are
372    first in the successor edge vector.  This is to make RPO order
373    as computed by pre_and_rev_post_order_compute be consistent with
374    what initial schedule generation expects.
375 */
376 
377 static void
canonicalize_loop_form(void)378 canonicalize_loop_form (void)
379 {
380   for (auto loop : loops_list (cfun, LI_FROM_INNERMOST))
381     {
382       edge e = single_exit (loop);
383       if (!e || (e->flags & (EDGE_COMPLEX|EDGE_FAKE)))
384 	continue;
385 
386       canonicalize_loop_closed_ssa (loop, e);
387 
388       /* If the exit is not first in the edge vector make it so.  */
389       if (e != EDGE_SUCC (e->src, 0))
390 	{
391 	  unsigned ei;
392 	  for (ei = 0; EDGE_SUCC (e->src, ei) != e; ++ei)
393 	    ;
394 	  std::swap (EDGE_SUCC (e->src, ei), EDGE_SUCC (e->src, 0));
395 	}
396     }
397 
398   /* We can end up releasing duplicate exit PHIs and also introduce
399      additional copies so the cached information isn't correct anymore.  */
400   scev_reset ();
401 
402   checking_verify_loop_closed_ssa (true);
403 }
404 
405 isl_ctx *the_isl_ctx;
406 
407 /* Perform a set of linear transforms on the loops of the current
408    function.  */
409 
410 void
graphite_transform_loops(void)411 graphite_transform_loops (void)
412 {
413   int i;
414   scop_p scop;
415   bool changed = false;
416   vec<scop_p> scops = vNULL;
417   isl_ctx *ctx;
418 
419   /* If a function is parallel it was most probably already run through graphite
420      once. No need to run again.  */
421   if (parallelized_function_p (cfun->decl))
422     return;
423 
424   calculate_dominance_info (CDI_DOMINATORS);
425 
426   /* We rely on post-dominators during merging of SESE regions so those
427      have to be meaningful.  */
428   connect_infinite_loops_to_exit ();
429 
430   ctx = isl_ctx_alloc ();
431   isl_options_set_on_error (ctx, ISL_ON_ERROR_ABORT);
432   the_isl_ctx = ctx;
433 
434   sort_sibling_loops (cfun);
435   canonicalize_loop_form ();
436 
437   /* Print the loop structure.  */
438   if (dump_file && (dump_flags & TDF_DETAILS))
439     {
440       print_loops (dump_file, 2);
441       print_loops (dump_file, 3);
442     }
443 
444   seir_cache = new hash_map<sese_scev_hash, tree>;
445 
446   calculate_dominance_info (CDI_POST_DOMINATORS);
447   build_scops (&scops);
448   free_dominance_info (CDI_POST_DOMINATORS);
449 
450   /* Remove the fake exits before transform given they are not reflected
451      in loop structures we end up verifying.  */
452   remove_fake_exit_edges ();
453 
454   if (dump_file && (dump_flags & TDF_DETAILS))
455     {
456       print_graphite_statistics (dump_file, scops);
457       print_global_statistics (dump_file);
458     }
459 
460   FOR_EACH_VEC_ELT (scops, i, scop)
461     if (dbg_cnt (graphite_scop))
462       {
463 	scop->isl_context = ctx;
464 	if (!build_poly_scop (scop))
465 	  continue;
466 
467 	if (!apply_poly_transforms (scop))
468 	  continue;
469 
470 	changed = true;
471 	if (graphite_regenerate_ast_isl (scop)
472 	    && dump_enabled_p ())
473 	  {
474 	    dump_user_location_t loc = find_loop_location
475 	      (scops[i]->scop_info->region.entry->dest->loop_father);
476 	    dump_printf_loc (MSG_OPTIMIZED_LOCATIONS, loc,
477 			     "loop nest optimized\n");
478 	  }
479       }
480 
481   delete seir_cache;
482   seir_cache = NULL;
483 
484   if (changed)
485     {
486       mark_virtual_operands_for_renaming (cfun);
487       update_ssa (TODO_update_ssa);
488       checking_verify_ssa (true, true);
489       rewrite_into_loop_closed_ssa (NULL, 0);
490       scev_reset ();
491       checking_verify_loop_structure ();
492     }
493 
494   if (dump_file && (dump_flags & TDF_DETAILS))
495     {
496       int num_no_dependency = 0;
497 
498       for (auto loop : loops_list (cfun, 0))
499 	if (loop->can_be_parallel)
500 	  num_no_dependency++;
501 
502       fprintf (dump_file, "%d loops carried no dependency.\n",
503 	       num_no_dependency);
504     }
505 
506   free_scops (scops);
507   the_isl_ctx = NULL;
508   isl_ctx_free (ctx);
509 
510   if (changed)
511     {
512       cleanup_tree_cfg ();
513       profile_status_for_fn (cfun) = PROFILE_ABSENT;
514       release_recorded_exits (cfun);
515       tree_estimate_probability (false);
516     }
517 }
518 
519 #else /* If isl is not available: #ifndef HAVE_isl.  */
520 
521 static void
graphite_transform_loops(void)522 graphite_transform_loops (void)
523 {
524   sorry ("Graphite loop optimizations cannot be used (isl is not available).");
525 }
526 
527 #endif
528 
529 
530 static unsigned int
graphite_transforms(struct function * fun)531 graphite_transforms (struct function *fun)
532 {
533   if (number_of_loops (fun) <= 1)
534     return 0;
535 
536   graphite_transform_loops ();
537 
538   return 0;
539 }
540 
541 static bool
gate_graphite_transforms(void)542 gate_graphite_transforms (void)
543 {
544   /* Enable -fgraphite pass if any one of the graphite optimization flags
545      is turned on.  */
546   if (flag_graphite_identity
547       || flag_loop_parallelize_all
548       || flag_loop_nest_optimize)
549     flag_graphite = 1;
550 
551   return flag_graphite != 0;
552 }
553 
554 namespace {
555 
556 const pass_data pass_data_graphite =
557 {
558   GIMPLE_PASS, /* type */
559   "graphite0", /* name */
560   OPTGROUP_LOOP, /* optinfo_flags */
561   TV_GRAPHITE, /* tv_id */
562   ( PROP_cfg | PROP_ssa ), /* properties_required */
563   0, /* properties_provided */
564   0, /* properties_destroyed */
565   0, /* todo_flags_start */
566   0, /* todo_flags_finish */
567 };
568 
569 class pass_graphite : public gimple_opt_pass
570 {
571 public:
pass_graphite(gcc::context * ctxt)572   pass_graphite (gcc::context *ctxt)
573     : gimple_opt_pass (pass_data_graphite, ctxt)
574   {}
575 
576   /* opt_pass methods: */
gate(function *)577   virtual bool gate (function *) { return gate_graphite_transforms (); }
578 
579 }; // class pass_graphite
580 
581 } // anon namespace
582 
583 gimple_opt_pass *
make_pass_graphite(gcc::context * ctxt)584 make_pass_graphite (gcc::context *ctxt)
585 {
586   return new pass_graphite (ctxt);
587 }
588 
589 namespace {
590 
591 const pass_data pass_data_graphite_transforms =
592 {
593   GIMPLE_PASS, /* type */
594   "graphite", /* name */
595   OPTGROUP_LOOP, /* optinfo_flags */
596   TV_GRAPHITE_TRANSFORMS, /* tv_id */
597   ( PROP_cfg | PROP_ssa ), /* properties_required */
598   0, /* properties_provided */
599   0, /* properties_destroyed */
600   0, /* todo_flags_start */
601   0, /* todo_flags_finish */
602 };
603 
604 class pass_graphite_transforms : public gimple_opt_pass
605 {
606 public:
pass_graphite_transforms(gcc::context * ctxt)607   pass_graphite_transforms (gcc::context *ctxt)
608     : gimple_opt_pass (pass_data_graphite_transforms, ctxt)
609   {}
610 
611   /* opt_pass methods: */
gate(function *)612   virtual bool gate (function *) { return gate_graphite_transforms (); }
execute(function * fun)613   virtual unsigned int execute (function *fun) { return graphite_transforms (fun); }
614 
615 }; // class pass_graphite_transforms
616 
617 } // anon namespace
618 
619 gimple_opt_pass *
make_pass_graphite_transforms(gcc::context * ctxt)620 make_pass_graphite_transforms (gcc::context *ctxt)
621 {
622   return new pass_graphite_transforms (ctxt);
623 }
624 
625 
626