1 /* If-conversion for vectorizer.
2    Copyright (C) 2004, 2005 Free Software Foundation, Inc.
3    Contributed by Devang Patel <dpatel@apple.com>
4 
5 This file is part of GCC.
6 
7 GCC is free software; you can redistribute it and/or modify it under
8 the terms of the GNU General Public License as published by the Free
9 Software Foundation; either version 2, or (at your option) any later
10 version.
11 
12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
14 FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
15 for more details.
16 
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING.  If not, write to the Free
19 Software Foundation, 51 Franklin Street, Fifth Floor, Boston, MA
20 02110-1301, USA.  */
21 
22 /* This pass implements tree level if-conversion transformation of loops.
23    Initial goal is to help vectorizer vectorize loops with conditions.
24 
25    A short description of if-conversion:
26 
27      o Decide if a loop is if-convertible or not.
28      o Walk all loop basic blocks in breadth first order (BFS order).
29        o Remove conditional statements (at the end of basic block)
30          and propagate condition into destination basic blocks'
31 	 predicate list.
32        o Replace modify expression with conditional modify expression
33          using current basic block's condition.
34      o Merge all basic blocks
35        o Replace phi nodes with conditional modify expr
36        o Merge all basic blocks into header
37 
38      Sample transformation:
39 
40      INPUT
41      -----
42 
43      # i_23 = PHI <0(0), i_18(10)>;
44      <L0>:;
45      j_15 = A[i_23];
46      if (j_15 > 41) goto <L1>; else goto <L17>;
47 
48      <L17>:;
49      goto <bb 3> (<L3>);
50 
51      <L1>:;
52 
53      # iftmp.2_4 = PHI <0(8), 42(2)>;
54      <L3>:;
55      A[i_23] = iftmp.2_4;
56      i_18 = i_23 + 1;
57      if (i_18 <= 15) goto <L19>; else goto <L18>;
58 
59      <L19>:;
60      goto <bb 1> (<L0>);
61 
62      <L18>:;
63 
64      OUTPUT
65      ------
66 
67      # i_23 = PHI <0(0), i_18(10)>;
68      <L0>:;
69      j_15 = A[i_23];
70 
71      <L3>:;
72      iftmp.2_4 = j_15 > 41 ? 42 : 0;
73      A[i_23] = iftmp.2_4;
74      i_18 = i_23 + 1;
75      if (i_18 <= 15) goto <L19>; else goto <L18>;
76 
77      <L19>:;
78      goto <bb 1> (<L0>);
79 
80      <L18>:;
81 */
82 
83 #include "config.h"
84 #include "system.h"
85 #include "coretypes.h"
86 #include "tm.h"
87 #include "tree.h"
88 #include "c-common.h"
89 #include "flags.h"
90 #include "timevar.h"
91 #include "varray.h"
92 #include "rtl.h"
93 #include "basic-block.h"
94 #include "diagnostic.h"
95 #include "tree-flow.h"
96 #include "tree-dump.h"
97 #include "cfgloop.h"
98 #include "tree-chrec.h"
99 #include "tree-data-ref.h"
100 #include "tree-scalar-evolution.h"
101 #include "tree-pass.h"
102 #include "target.h"
103 
104 /* local function prototypes */
105 static unsigned int main_tree_if_conversion (void);
106 static tree tree_if_convert_stmt (struct loop *loop, tree, tree,
107 				  block_stmt_iterator *);
108 static void tree_if_convert_cond_expr (struct loop *, tree, tree,
109 				       block_stmt_iterator *);
110 static bool if_convertible_phi_p (struct loop *, basic_block, tree);
111 static bool if_convertible_modify_expr_p (struct loop *, basic_block, tree);
112 static bool if_convertible_stmt_p (struct loop *, basic_block, tree);
113 static bool if_convertible_bb_p (struct loop *, basic_block, basic_block);
114 static bool if_convertible_loop_p (struct loop *, bool);
115 static void add_to_predicate_list (basic_block, tree);
116 static tree add_to_dst_predicate_list (struct loop * loop, edge,
117 				       tree, tree,
118 				       block_stmt_iterator *);
119 static void clean_predicate_lists (struct loop *loop);
120 static basic_block find_phi_replacement_condition (struct loop *loop,
121 						   basic_block, tree *,
122 						   block_stmt_iterator *);
123 static void replace_phi_with_cond_modify_expr (tree, tree, basic_block,
124                                                block_stmt_iterator *);
125 static void process_phi_nodes (struct loop *);
126 static void combine_blocks (struct loop *);
127 static tree ifc_temp_var (tree, tree);
128 static bool pred_blocks_visited_p (basic_block, bitmap *);
129 static basic_block * get_loop_body_in_if_conv_order (const struct loop *loop);
130 static bool bb_with_exit_edge_p (struct loop *, basic_block);
131 
132 /* List of basic blocks in if-conversion-suitable order.  */
133 static basic_block *ifc_bbs;
134 
135 /* Main entry point.
136    Apply if-conversion to the LOOP. Return true if successful otherwise return
137    false. If false is returned then loop remains unchanged.
138    FOR_VECTORIZER is a boolean flag. It indicates whether if-conversion is used
139    for vectorizer or not. If it is used for vectorizer, additional checks are
140    used. (Vectorization checks are not yet implemented).  */
141 
142 static bool
tree_if_conversion(struct loop * loop,bool for_vectorizer)143 tree_if_conversion (struct loop *loop, bool for_vectorizer)
144 {
145   basic_block bb;
146   block_stmt_iterator itr;
147   unsigned int i;
148 
149   ifc_bbs = NULL;
150 
151   /* if-conversion is not appropriate for all loops. First, check if loop  is
152      if-convertible or not.  */
153   if (!if_convertible_loop_p (loop, for_vectorizer))
154     {
155       if (dump_file && (dump_flags & TDF_DETAILS))
156 	fprintf (dump_file,"-------------------------\n");
157       if (ifc_bbs)
158 	{
159 	  free (ifc_bbs);
160 	  ifc_bbs = NULL;
161 	}
162       free_dominance_info (CDI_POST_DOMINATORS);
163       return false;
164     }
165 
166   /* Do actual work now.  */
167   for (i = 0; i < loop->num_nodes; i++)
168     {
169       tree cond;
170 
171       bb = ifc_bbs [i];
172 
173       /* Update condition using predicate list.  */
174       cond = bb->aux;
175 
176       /* Process all statements in this basic block.
177 	 Remove conditional expression, if any, and annotate
178 	 destination basic block(s) appropriately.  */
179       for (itr = bsi_start (bb); !bsi_end_p (itr); /* empty */)
180 	{
181 	  tree t = bsi_stmt (itr);
182 	  cond = tree_if_convert_stmt (loop, t, cond, &itr);
183 	  if (!bsi_end_p (itr))
184 	    bsi_next (&itr);
185 	}
186 
187       /* If current bb has only one successor, then consider it as an
188 	 unconditional goto.  */
189       if (single_succ_p (bb))
190 	{
191 	  basic_block bb_n = single_succ (bb);
192 	  if (cond != NULL_TREE)
193 	    add_to_predicate_list (bb_n, cond);
194 	}
195     }
196 
197   /* Now, all statements are if-converted and basic blocks are
198      annotated appropriately. Combine all basic block into one huge
199      basic block.  */
200   combine_blocks (loop);
201 
202   /* clean up */
203   clean_predicate_lists (loop);
204   free (ifc_bbs);
205   ifc_bbs = NULL;
206 
207   return true;
208 }
209 
210 /* if-convert stmt T which is part of LOOP.
211    If T is a MODIFY_EXPR than it is converted into conditional modify
212    expression using COND.  For conditional expressions, add condition in the
213    destination basic block's predicate list and remove conditional
214    expression itself. BSI is the iterator used to traverse statements of
215    loop. It is used here when it is required to delete current statement.  */
216 
217 static tree
tree_if_convert_stmt(struct loop * loop,tree t,tree cond,block_stmt_iterator * bsi)218 tree_if_convert_stmt (struct loop *  loop, tree t, tree cond,
219 		      block_stmt_iterator *bsi)
220 {
221   if (dump_file && (dump_flags & TDF_DETAILS))
222     {
223       fprintf (dump_file, "------if-convert stmt\n");
224       print_generic_stmt (dump_file, t, TDF_SLIM);
225       print_generic_stmt (dump_file, cond, TDF_SLIM);
226     }
227 
228   switch (TREE_CODE (t))
229     {
230       /* Labels are harmless here.  */
231     case LABEL_EXPR:
232       break;
233 
234     case MODIFY_EXPR:
235       /* This modify_expr is killing previous value of LHS. Appropriate value will
236 	 be selected by PHI node based on condition. It is possible that before
237 	 this transformation, PHI nodes was selecting default value and now it will
238 	 use this new value. This is OK because it does not change validity the
239 	 program.  */
240       break;
241 
242     case COND_EXPR:
243       /* Update destination blocks' predicate list and remove this
244 	 condition expression.  */
245       tree_if_convert_cond_expr (loop, t, cond, bsi);
246       cond = NULL_TREE;
247       break;
248 
249     default:
250       gcc_unreachable ();
251     }
252   return cond;
253 }
254 
255 /* STMT is COND_EXPR. Update two destination's predicate list.
256    Remove COND_EXPR, if it is not the loop exit condition. Otherwise
257    update loop exit condition appropriately.  BSI is the iterator
258    used to traverse statement list. STMT is part of loop LOOP.  */
259 
260 static void
tree_if_convert_cond_expr(struct loop * loop,tree stmt,tree cond,block_stmt_iterator * bsi)261 tree_if_convert_cond_expr (struct loop *loop, tree stmt, tree cond,
262 			   block_stmt_iterator *bsi)
263 {
264   tree c, c2;
265   edge true_edge, false_edge;
266 
267   gcc_assert (TREE_CODE (stmt) == COND_EXPR);
268 
269   c = COND_EXPR_COND (stmt);
270 
271   extract_true_false_edges_from_block (bb_for_stmt (stmt),
272  				       &true_edge, &false_edge);
273 
274   /* Add new condition into destination's predicate list.  */
275 
276   /* If 'c' is true then TRUE_EDGE is taken.  */
277   add_to_dst_predicate_list (loop, true_edge, cond,
278 			     unshare_expr (c), bsi);
279 
280   /* If 'c' is false then FALSE_EDGE is taken.  */
281   c2 = invert_truthvalue (unshare_expr (c));
282   add_to_dst_predicate_list (loop, false_edge, cond, c2, bsi);
283 
284   /* Now this conditional statement is redundant. Remove it.
285      But, do not remove exit condition! Update exit condition
286      using new condition.  */
287   if (!bb_with_exit_edge_p (loop, bb_for_stmt (stmt)))
288     {
289       bsi_remove (bsi, true);
290       cond = NULL_TREE;
291     }
292   return;
293 }
294 
295 /* Return true, iff PHI is if-convertible. PHI is part of loop LOOP
296    and it belongs to basic block BB.
297    PHI is not if-convertible
298    - if it has more than 2 arguments.
299    - Virtual PHI is immediately used in another PHI node.  */
300 
301 static bool
if_convertible_phi_p(struct loop * loop,basic_block bb,tree phi)302 if_convertible_phi_p (struct loop *loop, basic_block bb, tree phi)
303 {
304   if (dump_file && (dump_flags & TDF_DETAILS))
305     {
306       fprintf (dump_file, "-------------------------\n");
307       print_generic_stmt (dump_file, phi, TDF_SLIM);
308     }
309 
310   if (bb != loop->header && PHI_NUM_ARGS (phi) != 2)
311     {
312       if (dump_file && (dump_flags & TDF_DETAILS))
313 	fprintf (dump_file, "More than two phi node args.\n");
314       return false;
315     }
316 
317   if (!is_gimple_reg (SSA_NAME_VAR (PHI_RESULT (phi))))
318     {
319       imm_use_iterator imm_iter;
320       use_operand_p use_p;
321       FOR_EACH_IMM_USE_FAST (use_p, imm_iter, PHI_RESULT (phi))
322 	{
323 	  if (TREE_CODE (USE_STMT (use_p)) == PHI_NODE)
324 	    {
325 	      if (dump_file && (dump_flags & TDF_DETAILS))
326 		fprintf (dump_file, "Difficult to handle this virtual phi.\n");
327 	      return false;
328 	    }
329 	}
330     }
331 
332   return true;
333 }
334 
335 /* Return true, if M_EXPR is if-convertible.
336    MODIFY_EXPR is not if-convertible if,
337    - It is not movable.
338    - It could trap.
339    - LHS is not var decl.
340   MODIFY_EXPR is part of block BB, which is inside loop LOOP.
341 */
342 
343 static bool
if_convertible_modify_expr_p(struct loop * loop,basic_block bb,tree m_expr)344 if_convertible_modify_expr_p (struct loop *loop, basic_block bb, tree m_expr)
345 {
346   if (dump_file && (dump_flags & TDF_DETAILS))
347     {
348       fprintf (dump_file, "-------------------------\n");
349       print_generic_stmt (dump_file, m_expr, TDF_SLIM);
350     }
351 
352   /* Be conservative and do not handle immovable expressions.  */
353   if (movement_possibility (m_expr) == MOVE_IMPOSSIBLE)
354     {
355       if (dump_file && (dump_flags & TDF_DETAILS))
356 	fprintf (dump_file, "stmt is movable. Don't take risk\n");
357       return false;
358     }
359 
360   /* See if it needs speculative loading or not.  */
361   if (bb != loop->header
362       && tree_could_trap_p (TREE_OPERAND (m_expr, 1)))
363     {
364       if (dump_file && (dump_flags & TDF_DETAILS))
365 	fprintf (dump_file, "tree could trap...\n");
366       return false;
367     }
368 
369   if (TREE_CODE (TREE_OPERAND (m_expr, 1)) == CALL_EXPR)
370     {
371       if (dump_file && (dump_flags & TDF_DETAILS))
372 	fprintf (dump_file, "CALL_EXPR \n");
373       return false;
374     }
375 
376   if (TREE_CODE (TREE_OPERAND (m_expr, 0)) != SSA_NAME
377       && bb != loop->header
378       && !bb_with_exit_edge_p (loop, bb))
379     {
380       if (dump_file && (dump_flags & TDF_DETAILS))
381 	{
382 	  fprintf (dump_file, "LHS is not var\n");
383 	  print_generic_stmt (dump_file, m_expr, TDF_SLIM);
384 	}
385       return false;
386     }
387 
388 
389   return true;
390 }
391 
392 /* Return true, iff STMT is if-convertible.
393    Statement is if-convertible if,
394    - It is if-convertible MODIFY_EXPR
395    - IT is LABEL_EXPR or COND_EXPR.
396    STMT is inside block BB, which is inside loop LOOP.  */
397 
398 static bool
if_convertible_stmt_p(struct loop * loop,basic_block bb,tree stmt)399 if_convertible_stmt_p (struct loop *loop, basic_block bb, tree stmt)
400 {
401   switch (TREE_CODE (stmt))
402     {
403     case LABEL_EXPR:
404       break;
405 
406     case MODIFY_EXPR:
407 
408       if (!if_convertible_modify_expr_p (loop, bb, stmt))
409 	return false;
410       break;
411 
412     case COND_EXPR:
413       break;
414 
415     default:
416       /* Don't know what to do with 'em so don't do anything.  */
417       if (dump_file && (dump_flags & TDF_DETAILS))
418 	{
419 	  fprintf (dump_file, "don't know what to do\n");
420 	  print_generic_stmt (dump_file, stmt, TDF_SLIM);
421 	}
422       return false;
423       break;
424     }
425 
426   return true;
427 }
428 
429 /* Return true, iff BB is if-convertible.
430    Note: This routine does _not_ check basic block statements and phis.
431    Basic block is not if-convertible if,
432    - Basic block is non-empty and it is after exit block (in BFS order).
433    - Basic block is after exit block but before latch.
434    - Basic block edge(s) is not normal.
435    EXIT_BB_SEEN is true if basic block with exit edge is already seen.
436    BB is inside loop LOOP.  */
437 
438 static bool
if_convertible_bb_p(struct loop * loop,basic_block bb,basic_block exit_bb)439 if_convertible_bb_p (struct loop *loop, basic_block bb, basic_block exit_bb)
440 {
441   edge e;
442   edge_iterator ei;
443 
444   if (dump_file && (dump_flags & TDF_DETAILS))
445     fprintf (dump_file, "----------[%d]-------------\n", bb->index);
446 
447   if (exit_bb)
448     {
449       if (bb != loop->latch)
450 	{
451 	  if (dump_file && (dump_flags & TDF_DETAILS))
452 	    fprintf (dump_file, "basic block after exit bb but before latch\n");
453 	  return false;
454 	}
455       else if (!empty_block_p (bb))
456 	{
457 	  if (dump_file && (dump_flags & TDF_DETAILS))
458 	    fprintf (dump_file, "non empty basic block after exit bb\n");
459 	  return false;
460 	}
461       else if (bb == loop->latch
462 	       && bb != exit_bb
463 	       && !dominated_by_p (CDI_DOMINATORS, bb, exit_bb))
464 	  {
465 	    if (dump_file && (dump_flags & TDF_DETAILS))
466 	      fprintf (dump_file, "latch is not dominated by exit_block\n");
467 	    return false;
468 	  }
469     }
470 
471   /* Be less adventurous and handle only normal edges.  */
472   FOR_EACH_EDGE (e, ei, bb->succs)
473     if (e->flags &
474 	(EDGE_ABNORMAL_CALL | EDGE_EH | EDGE_ABNORMAL | EDGE_IRREDUCIBLE_LOOP))
475       {
476 	if (dump_file && (dump_flags & TDF_DETAILS))
477 	  fprintf (dump_file,"Difficult to handle edges\n");
478 	return false;
479       }
480 
481   return true;
482 }
483 
484 /* Return true, iff LOOP is if-convertible.
485    LOOP is if-convertible if,
486    - It is innermost.
487    - It has two or more basic blocks.
488    - It has only one exit.
489    - Loop header is not the exit edge.
490    - If its basic blocks and phi nodes are if convertible. See above for
491      more info.
492    FOR_VECTORIZER enables vectorizer specific checks. For example, support
493    for vector conditions, data dependency checks etc.. (Not implemented yet).  */
494 
495 static bool
if_convertible_loop_p(struct loop * loop,bool for_vectorizer ATTRIBUTE_UNUSED)496 if_convertible_loop_p (struct loop *loop, bool for_vectorizer ATTRIBUTE_UNUSED)
497 {
498   tree phi;
499   basic_block bb;
500   block_stmt_iterator itr;
501   unsigned int i;
502   edge e;
503   edge_iterator ei;
504   basic_block exit_bb = NULL;
505 
506   /* Handle only inner most loop.  */
507   if (!loop || loop->inner)
508     {
509       if (dump_file && (dump_flags & TDF_DETAILS))
510 	fprintf (dump_file, "not inner most loop\n");
511       return false;
512     }
513 
514   /* If only one block, no need for if-conversion.  */
515   if (loop->num_nodes <= 2)
516     {
517       if (dump_file && (dump_flags & TDF_DETAILS))
518 	fprintf (dump_file, "less than 2 basic blocks\n");
519       return false;
520     }
521 
522   /* More than one loop exit is too much to handle.  */
523   if (!loop->single_exit)
524     {
525       if (dump_file && (dump_flags & TDF_DETAILS))
526 	fprintf (dump_file, "multiple exits\n");
527       return false;
528     }
529 
530   /* ??? Check target's vector conditional operation support for vectorizer.  */
531 
532   /* If one of the loop header's edge is exit edge then do not apply
533      if-conversion.  */
534   FOR_EACH_EDGE (e, ei, loop->header->succs)
535     {
536       if (loop_exit_edge_p (loop, e))
537 	return false;
538     }
539 
540   calculate_dominance_info (CDI_DOMINATORS);
541   calculate_dominance_info (CDI_POST_DOMINATORS);
542 
543   /* Allow statements that can be handled during if-conversion.  */
544   ifc_bbs = get_loop_body_in_if_conv_order (loop);
545   if (!ifc_bbs)
546     {
547       if (dump_file && (dump_flags & TDF_DETAILS))
548 	fprintf (dump_file,"Irreducible loop\n");
549       free_dominance_info (CDI_POST_DOMINATORS);
550       return false;
551     }
552 
553   for (i = 0; i < loop->num_nodes; i++)
554     {
555       bb = ifc_bbs[i];
556 
557       if (!if_convertible_bb_p (loop, bb, exit_bb))
558 	return false;
559 
560       /* Check statements.  */
561       for (itr = bsi_start (bb); !bsi_end_p (itr); bsi_next (&itr))
562 	if (!if_convertible_stmt_p (loop, bb, bsi_stmt (itr)))
563 	  return false;
564       /* ??? Check data dependency for vectorizer.  */
565 
566       /* What about phi nodes ? */
567       phi = phi_nodes (bb);
568 
569       /* Clear aux field of incoming edges to a bb with a phi node.  */
570       if (phi)
571 	FOR_EACH_EDGE (e, ei, bb->preds)
572 	  e->aux = NULL;
573 
574       /* Check statements.  */
575       for (; phi; phi = PHI_CHAIN (phi))
576 	if (!if_convertible_phi_p (loop, bb, phi))
577 	  return false;
578 
579       if (bb_with_exit_edge_p (loop, bb))
580 	exit_bb = bb;
581     }
582 
583   /* OK. Did not find any potential issues so go ahead in if-convert
584      this loop. Now there is no looking back.  */
585   if (dump_file)
586     fprintf (dump_file,"Applying if-conversion\n");
587 
588   free_dominance_info (CDI_POST_DOMINATORS);
589   return true;
590 }
591 
592 /* Add condition COND into predicate list of basic block BB.  */
593 
594 static void
add_to_predicate_list(basic_block bb,tree new_cond)595 add_to_predicate_list (basic_block bb, tree new_cond)
596 {
597   tree cond = bb->aux;
598 
599   if (cond)
600     cond = fold_build2 (TRUTH_OR_EXPR, boolean_type_node,
601 			unshare_expr (cond), new_cond);
602   else
603     cond = new_cond;
604 
605   bb->aux = cond;
606 }
607 
608 /* Add condition COND into BB's predicate list.  PREV_COND is
609    existing condition.  */
610 
611 static tree
add_to_dst_predicate_list(struct loop * loop,edge e,tree prev_cond,tree cond,block_stmt_iterator * bsi)612 add_to_dst_predicate_list (struct loop * loop, edge e,
613 			   tree prev_cond, tree cond,
614 			   block_stmt_iterator *bsi)
615 {
616   tree new_cond = NULL_TREE;
617 
618   if (!flow_bb_inside_loop_p (loop, e->dest))
619     return NULL_TREE;
620 
621   if (prev_cond == boolean_true_node || !prev_cond)
622     new_cond = unshare_expr (cond);
623   else
624     {
625       tree tmp;
626       tree tmp_stmt = NULL_TREE;
627       tree tmp_stmts1 = NULL_TREE;
628       tree tmp_stmts2 = NULL_TREE;
629       prev_cond = force_gimple_operand (unshare_expr (prev_cond),
630 					&tmp_stmts1, true, NULL);
631       if (tmp_stmts1)
632         bsi_insert_before (bsi, tmp_stmts1, BSI_SAME_STMT);
633 
634       cond = force_gimple_operand (unshare_expr (cond),
635 				   &tmp_stmts2, true, NULL);
636       if (tmp_stmts2)
637         bsi_insert_before (bsi, tmp_stmts2, BSI_SAME_STMT);
638 
639       /* Add the condition to aux field of the edge.  In case edge
640 	 destination is a PHI node, this condition will be ANDed with
641 	 block predicate to construct complete condition.  */
642       e->aux = cond;
643 
644       /* new_cond == prev_cond AND cond */
645       tmp = build2 (TRUTH_AND_EXPR, boolean_type_node,
646 		    unshare_expr (prev_cond), cond);
647       tmp_stmt = ifc_temp_var (boolean_type_node, tmp);
648       bsi_insert_before (bsi, tmp_stmt, BSI_SAME_STMT);
649       new_cond = TREE_OPERAND (tmp_stmt, 0);
650     }
651   add_to_predicate_list (e->dest, new_cond);
652   return new_cond;
653 }
654 
655 /* During if-conversion aux field from basic block structure is used to hold
656    predicate list. Clean each basic block's predicate list for the given LOOP.
657    Also clean aux field of succesor edges, used to hold true and false
658    condition from conditional expression.  */
659 
660 static void
clean_predicate_lists(struct loop * loop)661 clean_predicate_lists (struct loop *loop)
662 {
663   basic_block *bb;
664   unsigned int i;
665   edge e;
666   edge_iterator ei;
667 
668   bb = get_loop_body (loop);
669   for (i = 0; i < loop->num_nodes; i++)
670     {
671       bb[i]->aux = NULL;
672       FOR_EACH_EDGE (e, ei, bb[i]->succs)
673 	e->aux = NULL;
674     }
675   free (bb);
676 }
677 
678 /* Basic block BB has two predecessors. Using predecessor's aux field, set
679    appropriate condition COND for the PHI node replacement. Return true block
680    whose phi arguments are selected when cond is true.  */
681 
682 static basic_block
find_phi_replacement_condition(struct loop * loop,basic_block bb,tree * cond,block_stmt_iterator * bsi)683 find_phi_replacement_condition (struct loop *loop,
684 				basic_block bb, tree *cond,
685                                 block_stmt_iterator *bsi)
686 {
687   edge first_edge, second_edge;
688   tree tmp_cond, new_stmts;
689 
690   gcc_assert (EDGE_COUNT (bb->preds) == 2);
691   first_edge = EDGE_PRED (bb, 0);
692   second_edge = EDGE_PRED (bb, 1);
693 
694   /* Use condition based on following criteria:
695      1)
696        S1: x = !c ? a : b;
697 
698        S2: x = c ? b : a;
699 
700        S2 is preferred over S1. Make 'b' first_bb and use its condition.
701 
702      2) Do not make loop header first_bb.
703 
704      3)
705        S1: x = !(c == d)? a : b;
706 
707        S21: t1 = c == d;
708        S22: x = t1 ? b : a;
709 
710        S3: x = (c == d) ? b : a;
711 
712        S3 is preferred over S1 and S2*, Make 'b' first_bb and use
713        its condition.
714 
715      4) If  pred B is dominated by pred A then use pred B's condition.
716         See PR23115.  */
717 
718   /* Select condition that is not TRUTH_NOT_EXPR.  */
719   tmp_cond = (first_edge->src)->aux;
720   if (TREE_CODE (tmp_cond) == TRUTH_NOT_EXPR)
721     {
722       edge tmp_edge;
723 
724       tmp_edge = first_edge;
725       first_edge = second_edge;
726       second_edge = tmp_edge;
727     }
728 
729   /* Check if FIRST_BB is loop header or not and make sure that
730      FIRST_BB does not dominate SECOND_BB.  */
731   if (first_edge->src == loop->header
732       || dominated_by_p (CDI_DOMINATORS,
733 			 second_edge->src, first_edge->src))
734     {
735       *cond = (second_edge->src)->aux;
736 
737       /* If there is a condition on an incoming edge,
738 	 AND it with the incoming bb predicate.  */
739       if (second_edge->aux)
740 	*cond = build2 (TRUTH_AND_EXPR, boolean_type_node,
741 			*cond, second_edge->aux);
742 
743       if (TREE_CODE (*cond) == TRUTH_NOT_EXPR)
744 	/* We can be smart here and choose inverted
745 	   condition without switching bbs.  */
746 	*cond = invert_truthvalue (*cond);
747       else
748 	/* Select non loop header bb.  */
749 	first_edge = second_edge;
750     }
751   else
752     {
753       /* FIRST_BB is not loop header */
754       *cond = (first_edge->src)->aux;
755 
756       /* If there is a condition on an incoming edge,
757 	 AND it with the incoming bb predicate.  */
758       if (first_edge->aux)
759 	*cond = build2 (TRUTH_AND_EXPR, boolean_type_node,
760 			*cond, first_edge->aux);
761     }
762 
763   /* Create temp. for the condition. Vectorizer prefers to have gimple
764      value as condition. Various targets use different means to communicate
765      condition in vector compare operation. Using gimple value allows
766      compiler to emit vector compare and select RTL without exposing
767      compare's result.  */
768   *cond = force_gimple_operand (unshare_expr (*cond), &new_stmts,
769 				false, NULL_TREE);
770   if (new_stmts)
771     bsi_insert_before (bsi, new_stmts, BSI_SAME_STMT);
772   if (!is_gimple_reg (*cond) && !is_gimple_condexpr (*cond))
773     {
774       tree new_stmt;
775 
776       new_stmt = ifc_temp_var (TREE_TYPE (*cond), unshare_expr (*cond));
777       bsi_insert_before (bsi, new_stmt, BSI_SAME_STMT);
778       *cond = TREE_OPERAND (new_stmt, 0);
779     }
780 
781   gcc_assert (*cond);
782 
783   return first_edge->src;
784 }
785 
786 
787 /* Replace PHI node with conditional modify expr using COND.
788    This routine does not handle PHI nodes with more than two arguments.
789    For example,
790      S1: A = PHI <x1(1), x2(5)
791    is converted into,
792      S2: A = cond ? x1 : x2;
793    S2 is inserted at the top of basic block's statement list.
794    When COND is true, phi arg from TRUE_BB is selected.
795 */
796 
797 static void
replace_phi_with_cond_modify_expr(tree phi,tree cond,basic_block true_bb,block_stmt_iterator * bsi)798 replace_phi_with_cond_modify_expr (tree phi, tree cond, basic_block true_bb,
799                                    block_stmt_iterator *bsi)
800 {
801   tree new_stmt;
802   basic_block bb;
803   tree rhs;
804   tree arg_0, arg_1;
805 
806   gcc_assert (TREE_CODE (phi) == PHI_NODE);
807 
808   /* If this is not filtered earlier, then now it is too late.  */
809   gcc_assert (PHI_NUM_ARGS (phi) == 2);
810 
811   /* Find basic block and initialize iterator.  */
812   bb = bb_for_stmt (phi);
813 
814   /* Use condition that is not TRUTH_NOT_EXPR in conditional modify expr.  */
815   if (EDGE_PRED (bb, 1)->src == true_bb)
816     {
817       arg_0 = PHI_ARG_DEF (phi, 1);
818       arg_1 = PHI_ARG_DEF (phi, 0);
819     }
820   else
821     {
822       arg_0 = PHI_ARG_DEF (phi, 0);
823       arg_1 = PHI_ARG_DEF (phi, 1);
824     }
825 
826   /* Build new RHS using selected condition and arguments.  */
827   rhs = build3 (COND_EXPR, TREE_TYPE (PHI_RESULT (phi)),
828 	        unshare_expr (cond), unshare_expr (arg_0),
829 	        unshare_expr (arg_1));
830 
831   /* Create new MODIFY expression using RHS.  */
832   new_stmt = build2 (MODIFY_EXPR, TREE_TYPE (PHI_RESULT (phi)),
833 		     unshare_expr (PHI_RESULT (phi)), rhs);
834 
835   /* Make new statement definition of the original phi result.  */
836   SSA_NAME_DEF_STMT (PHI_RESULT (phi)) = new_stmt;
837 
838   /* Insert using iterator.  */
839   bsi_insert_before (bsi, new_stmt, BSI_SAME_STMT);
840   update_stmt (new_stmt);
841 
842   if (dump_file && (dump_flags & TDF_DETAILS))
843     {
844       fprintf (dump_file, "new phi replacement stmt\n");
845       print_generic_stmt (dump_file, new_stmt, TDF_SLIM);
846     }
847 }
848 
849 /* Process phi nodes for the given  LOOP.  Replace phi nodes with cond
850    modify expr.  */
851 
852 static void
process_phi_nodes(struct loop * loop)853 process_phi_nodes (struct loop *loop)
854 {
855   basic_block bb;
856   unsigned int orig_loop_num_nodes = loop->num_nodes;
857   unsigned int i;
858 
859   /* Replace phi nodes with cond. modify expr.  */
860   for (i = 1; i < orig_loop_num_nodes; i++)
861     {
862       tree phi, cond;
863       block_stmt_iterator bsi;
864       basic_block true_bb = NULL;
865       bb = ifc_bbs[i];
866 
867       if (bb == loop->header)
868 	continue;
869 
870       phi = phi_nodes (bb);
871       bsi = bsi_after_labels (bb);
872 
873       /* BB has two predecessors. Using predecessor's aux field, set
874 	 appropriate condition for the PHI node replacement.  */
875       if (phi)
876 	true_bb = find_phi_replacement_condition (loop, bb, &cond, &bsi);
877 
878       while (phi)
879 	{
880 	  tree next = PHI_CHAIN (phi);
881 	  replace_phi_with_cond_modify_expr (phi, cond, true_bb, &bsi);
882 	  release_phi_node (phi);
883 	  phi = next;
884 	}
885       bb->phi_nodes = NULL;
886     }
887   return;
888 }
889 
890 /* Combine all basic block from the given LOOP into one or two super
891    basic block.  Replace PHI nodes with conditional modify expression.  */
892 
893 static void
combine_blocks(struct loop * loop)894 combine_blocks (struct loop *loop)
895 {
896   basic_block bb, exit_bb, merge_target_bb;
897   unsigned int orig_loop_num_nodes = loop->num_nodes;
898   unsigned int i;
899   edge e;
900   edge_iterator ei;
901 
902   /* Process phi nodes to prepare blocks for merge.  */
903   process_phi_nodes (loop);
904 
905   /* Merge basic blocks.  First remove all the edges in the loop, except
906      for those from the exit block.  */
907   exit_bb = NULL;
908   for (i = 0; i < orig_loop_num_nodes; i++)
909     {
910       bb = ifc_bbs[i];
911       if (bb_with_exit_edge_p (loop, bb))
912 	{
913 	  exit_bb = bb;
914 	  break;
915 	}
916     }
917   gcc_assert (exit_bb != loop->latch);
918 
919   for (i = 1; i < orig_loop_num_nodes; i++)
920     {
921       bb = ifc_bbs[i];
922 
923       for (ei = ei_start (bb->preds); (e = ei_safe_edge (ei));)
924 	{
925 	  if (e->src == exit_bb)
926 	    ei_next (&ei);
927 	  else
928 	    remove_edge (e);
929 	}
930     }
931 
932   if (exit_bb != NULL)
933     {
934       if (exit_bb != loop->header)
935 	{
936 	  /* Connect this node with loop header.  */
937 	  make_edge (loop->header, exit_bb, EDGE_FALLTHRU);
938 	  set_immediate_dominator (CDI_DOMINATORS, exit_bb, loop->header);
939 	}
940 
941       /* Redirect non-exit edges to loop->latch.  */
942       FOR_EACH_EDGE (e, ei, exit_bb->succs)
943 	{
944 	  if (!loop_exit_edge_p (loop, e))
945 	    redirect_edge_and_branch (e, loop->latch);
946 	}
947       set_immediate_dominator (CDI_DOMINATORS, loop->latch, exit_bb);
948     }
949   else
950     {
951       /* If the loop does not have exit then reconnect header and latch.  */
952       make_edge (loop->header, loop->latch, EDGE_FALLTHRU);
953       set_immediate_dominator (CDI_DOMINATORS, loop->latch, loop->header);
954     }
955 
956   merge_target_bb = loop->header;
957   for (i = 1; i < orig_loop_num_nodes; i++)
958     {
959       block_stmt_iterator bsi;
960       tree_stmt_iterator last;
961 
962       bb = ifc_bbs[i];
963 
964       if (bb == exit_bb || bb == loop->latch)
965 	continue;
966 
967       /* Remove labels and make stmts member of loop->header.  */
968       for (bsi = bsi_start (bb); !bsi_end_p (bsi); )
969 	{
970 	  if (TREE_CODE (bsi_stmt (bsi)) == LABEL_EXPR)
971 	    bsi_remove (&bsi, true);
972 	  else
973 	    {
974 	      set_bb_for_stmt (bsi_stmt (bsi), merge_target_bb);
975 	      bsi_next (&bsi);
976 	    }
977 	}
978 
979       /* Update stmt list.  */
980       last = tsi_last (merge_target_bb->stmt_list);
981       tsi_link_after (&last, bb->stmt_list, TSI_NEW_STMT);
982       bb->stmt_list = NULL;
983 
984       /* Update dominator info.  */
985       if (dom_computed[CDI_DOMINATORS])
986 	delete_from_dominance_info (CDI_DOMINATORS, bb);
987       if (dom_computed[CDI_POST_DOMINATORS])
988 	delete_from_dominance_info (CDI_POST_DOMINATORS, bb);
989 
990       /* Remove basic block.  */
991       remove_bb_from_loops (bb);
992       expunge_block (bb);
993     }
994 
995   /* Now if possible, merge loop header and block with exit edge.
996      This reduces number of basic blocks to 2. Auto vectorizer addresses
997      loops with two nodes only.  FIXME: Use cleanup_tree_cfg().  */
998   if (exit_bb
999       && exit_bb != loop->header
1000       && can_merge_blocks_p (loop->header, exit_bb))
1001     {
1002       remove_bb_from_loops (exit_bb);
1003       merge_blocks (loop->header, exit_bb);
1004     }
1005 }
1006 
1007 /* Make new  temp variable of type TYPE. Add MODIFY_EXPR to assign EXP
1008    to the new variable.  */
1009 
1010 static tree
ifc_temp_var(tree type,tree exp)1011 ifc_temp_var (tree type, tree exp)
1012 {
1013   const char *name = "_ifc_";
1014   tree var, stmt, new_name;
1015 
1016   if (is_gimple_reg (exp))
1017     return exp;
1018 
1019   /* Create new temporary variable.  */
1020   var = create_tmp_var (type, name);
1021   add_referenced_var (var);
1022 
1023   /* Build new statement to assign EXP to new variable.  */
1024   stmt = build2 (MODIFY_EXPR, type, var, exp);
1025 
1026   /* Get SSA name for the new variable and set make new statement
1027      its definition statement.  */
1028   new_name = make_ssa_name (var, stmt);
1029   TREE_OPERAND (stmt, 0) = new_name;
1030   SSA_NAME_DEF_STMT (new_name) = stmt;
1031 
1032   return stmt;
1033 }
1034 
1035 
1036 /* Return TRUE iff, all pred blocks of BB are visited.
1037    Bitmap VISITED keeps history of visited blocks.  */
1038 
1039 static bool
pred_blocks_visited_p(basic_block bb,bitmap * visited)1040 pred_blocks_visited_p (basic_block bb, bitmap *visited)
1041 {
1042   edge e;
1043   edge_iterator ei;
1044   FOR_EACH_EDGE (e, ei, bb->preds)
1045     if (!bitmap_bit_p (*visited, e->src->index))
1046       return false;
1047 
1048   return true;
1049 }
1050 
1051 /* Get body of a LOOP in suitable order for if-conversion.
1052    It is caller's responsibility to deallocate basic block
1053    list.  If-conversion suitable order is, BFS order with one
1054    additional constraint. Select block in BFS block, if all
1055    pred are already selected.  */
1056 
1057 static basic_block *
get_loop_body_in_if_conv_order(const struct loop * loop)1058 get_loop_body_in_if_conv_order (const struct loop *loop)
1059 {
1060   basic_block *blocks, *blocks_in_bfs_order;
1061   basic_block bb;
1062   bitmap visited;
1063   unsigned int index = 0;
1064   unsigned int visited_count = 0;
1065 
1066   gcc_assert (loop->num_nodes);
1067   gcc_assert (loop->latch != EXIT_BLOCK_PTR);
1068 
1069   blocks = XCNEWVEC (basic_block, loop->num_nodes);
1070   visited = BITMAP_ALLOC (NULL);
1071 
1072   blocks_in_bfs_order = get_loop_body_in_bfs_order (loop);
1073 
1074   index = 0;
1075   while (index < loop->num_nodes)
1076     {
1077       bb = blocks_in_bfs_order [index];
1078 
1079       if (bb->flags & BB_IRREDUCIBLE_LOOP)
1080 	{
1081 	  free (blocks_in_bfs_order);
1082 	  BITMAP_FREE (visited);
1083 	  free (blocks);
1084 	  return NULL;
1085 	}
1086       if (!bitmap_bit_p (visited, bb->index))
1087 	{
1088 	  if (pred_blocks_visited_p (bb, &visited)
1089 	      || bb == loop->header)
1090 	    {
1091 	      /* This block is now visited.  */
1092 	      bitmap_set_bit (visited, bb->index);
1093 	      blocks[visited_count++] = bb;
1094 	    }
1095 	}
1096       index++;
1097       if (index == loop->num_nodes
1098 	  && visited_count != loop->num_nodes)
1099 	{
1100 	  /* Not done yet.  */
1101 	  index = 0;
1102 	}
1103     }
1104   free (blocks_in_bfs_order);
1105   BITMAP_FREE (visited);
1106   return blocks;
1107 }
1108 
1109 /* Return true if one of the basic block BB edge is exit of LOOP.  */
1110 
1111 static bool
bb_with_exit_edge_p(struct loop * loop,basic_block bb)1112 bb_with_exit_edge_p (struct loop *loop, basic_block bb)
1113 {
1114   edge e;
1115   edge_iterator ei;
1116   bool exit_edge_found = false;
1117 
1118   FOR_EACH_EDGE (e, ei, bb->succs)
1119     if (loop_exit_edge_p (loop, e))
1120       {
1121 	exit_edge_found = true;
1122 	break;
1123       }
1124 
1125   return exit_edge_found;
1126 }
1127 
1128 /* Tree if-conversion pass management.  */
1129 
1130 static unsigned int
main_tree_if_conversion(void)1131 main_tree_if_conversion (void)
1132 {
1133   unsigned i, loop_num;
1134   struct loop *loop;
1135 
1136   if (!current_loops)
1137     return 0;
1138 
1139   loop_num = current_loops->num;
1140   for (i = 0; i < loop_num; i++)
1141     {
1142       loop =  current_loops->parray[i];
1143       if (!loop)
1144       continue;
1145 
1146       tree_if_conversion (loop, true);
1147     }
1148   return 0;
1149 }
1150 
1151 static bool
gate_tree_if_conversion(void)1152 gate_tree_if_conversion (void)
1153 {
1154   return flag_tree_vectorize != 0;
1155 }
1156 
1157 struct tree_opt_pass pass_if_conversion =
1158 {
1159   "ifcvt",				/* name */
1160   gate_tree_if_conversion,		/* gate */
1161   main_tree_if_conversion,		/* execute */
1162   NULL,					/* sub */
1163   NULL,					/* next */
1164   0,					/* static_pass_number */
1165   0,					/* tv_id */
1166   PROP_cfg | PROP_ssa | PROP_alias,	/* properties_required */
1167   0,					/* properties_provided */
1168   0,					/* properties_destroyed */
1169   0,					/* todo_flags_start */
1170   TODO_dump_func | TODO_verify_loops | TODO_verify_stmts | TODO_verify_flow,
1171                                         /* todo_flags_finish */
1172   0					/* letter */
1173 };
1174