gcc/tree-ssa-reassoc.c

   1 /* Reassociation for trees.
   2    Copyright (C) 2005-2017 Free Software Foundation, Inc.
   3    Contributed by Daniel Berlin <dan@dberlin.org>
   4
   5 This file is part of GCC.
   6
   7 GCC is free software; you can redistribute it and/or modify
   8 it under the terms of the GNU General Public License as published by
   9 the Free Software Foundation; either version 3, or (at your option)
  10 any later version.
  11
  12 GCC is distributed in the hope that it will be useful,
  13 but WITHOUT ANY WARRANTY; without even the implied warranty of
  14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  15 GNU General Public License for more details.
  16
  17 You should have received a copy of the GNU General Public License
  18 along with GCC; see the file COPYING3.  If not see
  19 <http://www.gnu.org/licenses/>.  */
  20
  21 #include "config.h"
  22 #include "system.h"
  23 #include "coretypes.h"
  24 #include "backend.h"
  25 #include "target.h"
  26 #include "rtl.h"
  27 #include "tree.h"
  28 #include "gimple.h"
  29 #include "cfghooks.h"
  30 #include "alloc-pool.h"
  31 #include "tree-pass.h"
  32 #include "memmodel.h"
  33 #include "tm_p.h"
  34 #include "ssa.h"
  35 #include "optabs-tree.h"
  36 #include "gimple-pretty-print.h"
  37 #include "diagnostic-core.h"
  38 #include "fold-const.h"
  39 #include "stor-layout.h"
  40 #include "cfganal.h"
  41 #include "gimple-fold.h"
  42 #include "tree-eh.h"
  43 #include "gimple-iterator.h"
  44 #include "gimplify-me.h"
  45 #include "tree-cfg.h"
  46 #include "tree-ssa-loop.h"
  47 #include "flags.h"
  48 #include "tree-ssa.h"
  49 #include "langhooks.h"
  50 #include "cfgloop.h"
  51 #include "params.h"
  52 #include "builtins.h"
  53 #include "gimplify.h"
  54 #include "case-cfn-macros.h"
  55
  56 /*  This is a simple global reassociation pass.  It is, in part, based
  57     on the LLVM pass of the same name (They do some things more/less
  58     than we do, in different orders, etc).
  59
  60     It consists of five steps:
  61
  62     1. Breaking up subtract operations into addition + negate, where
  63     it would promote the reassociation of adds.
  64
  65     2. Left linearization of the expression trees, so that (A+B)+(C+D)
  66     becomes (((A+B)+C)+D), which is easier for us to rewrite later.
  67     During linearization, we place the operands of the binary
  68     expressions into a vector of operand_entry_*
  69
  70     3. Optimization of the operand lists, eliminating things like a +
  71     -a, a & a, etc.
  72
  73     3a. Combine repeated factors with the same occurrence counts
  74     into a __builtin_powi call that will later be optimized into
  75     an optimal number of multiplies.
  76
  77     4. Rewrite the expression trees we linearized and optimized so
  78     they are in proper rank order.
  79
  80     5. Repropagate negates, as nothing else will clean it up ATM.
  81
  82     A bit of theory on #4, since nobody seems to write anything down
  83     about why it makes sense to do it the way they do it:
  84
  85     We could do this much nicer theoretically, but don't (for reasons
  86     explained after how to do it theoretically nice :P).
  87
  88     In order to promote the most redundancy elimination, you want
  89     binary expressions whose operands are the same rank (or
  90     preferably, the same value) exposed to the redundancy eliminator,
  91     for possible elimination.
  92
  93     So the way to do this if we really cared, is to build the new op
  94     tree from the leaves to the roots, merging as you go, and putting the
  95     new op on the end of the worklist, until you are left with one
  96     thing on the worklist.
  97
  98     IE if you have to rewrite the following set of operands (listed with
  99     rank in parentheses), with opcode PLUS_EXPR:
 100
 101     a (1),  b (1),  c (1),  d (2), e (2)
 102
 103
 104     We start with our merge worklist empty, and the ops list with all of
 105     those on it.
 106
 107     You want to first merge all leaves of the same rank, as much as
 108     possible.
 109
 110     So first build a binary op of
 111
 112     mergetmp = a + b, and put "mergetmp" on the merge worklist.
 113
 114     Because there is no three operand form of PLUS_EXPR, c is not going to
 115     be exposed to redundancy elimination as a rank 1 operand.
 116
 117     So you might as well throw it on the merge worklist (you could also
 118     consider it to now be a rank two operand, and merge it with d and e,
 119     but in this case, you then have evicted e from a binary op. So at
 120     least in this situation, you can't win.)
 121
 122     Then build a binary op of d + e
 123     mergetmp2 = d + e
 124
 125     and put mergetmp2 on the merge worklist.
 126
 127     so merge worklist = {mergetmp, c, mergetmp2}
 128
 129     Continue building binary ops of these operations until you have only
 130     one operation left on the worklist.
 131
 132     So we have
 133
 134     build binary op
 135     mergetmp3 = mergetmp + c
 136
 137     worklist = {mergetmp2, mergetmp3}
 138
 139     mergetmp4 = mergetmp2 + mergetmp3
 140
 141     worklist = {mergetmp4}
 142
 143     because we have one operation left, we can now just set the original
 144     statement equal to the result of that operation.
 145
 146     This will at least expose a + b  and d + e to redundancy elimination
 147     as binary operations.
 148
 149     For extra points, you can reuse the old statements to build the
 150     mergetmps, since you shouldn't run out.
 151
 152     So why don't we do this?
 153
 154     Because it's expensive, and rarely will help.  Most trees we are
 155     reassociating have 3 or less ops.  If they have 2 ops, they already
 156     will be written into a nice single binary op.  If you have 3 ops, a
 157     single simple check suffices to tell you whether the first two are of the
 158     same rank.  If so, you know to order it
 159
 160     mergetmp = op1 + op2
 161     newstmt = mergetmp + op3
 162
 163     instead of
 164     mergetmp = op2 + op3
 165     newstmt = mergetmp + op1
 166
 167     If all three are of the same rank, you can't expose them all in a
 168     single binary operator anyway, so the above is *still* the best you
 169     can do.
 170
 171     Thus, this is what we do.  When we have three ops left, we check to see
 172     what order to put them in, and call it a day.  As a nod to vector sum
 173     reduction, we check if any of the ops are really a phi node that is a
 174     destructive update for the associating op, and keep the destructive
 175     update together for vector sum reduction recognition.  */
 176
 177 /* Enable insertion of __builtin_powi calls during execute_reassoc.  See
 178    point 3a in the pass header comment.  */
 179 static bool reassoc_insert_powi_p;
 180
 181 /* Statistics */
 182 static struct
 183 {
 184   int linearized;
 185   int constants_eliminated;
 186   int ops_eliminated;
 187   int rewritten;
 188   int pows_encountered;
 189   int pows_created;
 190 } reassociate_stats;
 191
 192 /* Operator, rank pair.  */
 193 struct operand_entry
 194 {
 195   unsigned int rank;
 196   unsigned int id;
 197   tree op;
 198   unsigned int count;
 199   gimple *stmt_to_insert;
 200 };
 201
 202 static object_allocator<operand_entry> operand_entry_pool
 203   ("operand entry pool");
 204
 205 /* This is used to assign a unique ID to each struct operand_entry
 206    so that qsort results are identical on different hosts.  */
 207 static unsigned int next_operand_entry_id;
 208
 209 /* Starting rank number for a given basic block, so that we can rank
 210    operations using unmovable instructions in that BB based on the bb
 211    depth.  */
 212 static long *bb_rank;
 213
 214 /* Operand->rank hashtable.  */
 215 static hash_map<tree, long> *operand_rank;
 216
 217 /* Vector of SSA_NAMEs on which after reassociate_bb is done with
 218    all basic blocks the CFG should be adjusted - basic blocks
 219    split right after that SSA_NAME's definition statement and before
 220    the only use, which must be a bit ior.  */
 221 static vec<tree> reassoc_branch_fixups;
 222
 223 /* Forward decls.  */
 224 static long get_rank (tree);
 225 static bool reassoc_stmt_dominates_stmt_p (gimple *, gimple *);
 226
 227 /* Wrapper around gsi_remove, which adjusts gimple_uid of debug stmts
 228    possibly added by gsi_remove.  */
 229
 230 bool
 231 reassoc_remove_stmt (gimple_stmt_iterator *gsi)
 232 {
 233   gimple *stmt = gsi_stmt (*gsi);
 234
 235   if (!MAY_HAVE_DEBUG_STMTS || gimple_code (stmt) == GIMPLE_PHI)
 236     return gsi_remove (gsi, true);
 237
 238   gimple_stmt_iterator prev = *gsi;
 239   gsi_prev (&prev);
 240   unsigned uid = gimple_uid (stmt);
 241   basic_block bb = gimple_bb (stmt);
 242   bool ret = gsi_remove (gsi, true);
 243   if (!gsi_end_p (prev))
 244     gsi_next (&prev);
 245   else
 246     prev = gsi_start_bb (bb);
 247   gimple *end_stmt = gsi_stmt (*gsi);
 248   while ((stmt = gsi_stmt (prev)) != end_stmt)
 249     {
 250       gcc_assert (stmt && is_gimple_debug (stmt) && gimple_uid (stmt) == 0);
 251       gimple_set_uid (stmt, uid);
 252       gsi_next (&prev);
 253     }
 254   return ret;
 255 }
 256
 257 /* Bias amount for loop-carried phis.  We want this to be larger than
 258    the depth of any reassociation tree we can see, but not larger than
 259    the rank difference between two blocks.  */
 260 #define PHI_LOOP_BIAS (1 << 15)
 261
 262 /* Rank assigned to a phi statement.  If STMT is a loop-carried phi of
 263    an innermost loop, and the phi has only a single use which is inside
 264    the loop, then the rank is the block rank of the loop latch plus an
 265    extra bias for the loop-carried dependence.  This causes expressions
 266    calculated into an accumulator variable to be independent for each
 267    iteration of the loop.  If STMT is some other phi, the rank is the
 268    block rank of its containing block.  */
 269 static long
 270 phi_rank (gimple *stmt)
 271 {
 272   basic_block bb = gimple_bb (stmt);
 273   struct loop *father = bb->loop_father;
 274   tree res;
 275   unsigned i;
 276   use_operand_p use;
 277   gimple *use_stmt;
 278
 279   /* We only care about real loops (those with a latch).  */
 280   if (!father->latch)
 281     return bb_rank[bb->index];
 282
 283   /* Interesting phis must be in headers of innermost loops.  */
 284   if (bb != father->header
 285       || father->inner)
 286     return bb_rank[bb->index];
 287
 288   /* Ignore virtual SSA_NAMEs.  */
 289   res = gimple_phi_result (stmt);
 290   if (virtual_operand_p (res))
 291     return bb_rank[bb->index];
 292
 293   /* The phi definition must have a single use, and that use must be
 294      within the loop.  Otherwise this isn't an accumulator pattern.  */
 295   if (!single_imm_use (res, &use, &use_stmt)
 296       || gimple_bb (use_stmt)->loop_father != father)
 297     return bb_rank[bb->index];
 298
 299   /* Look for phi arguments from within the loop.  If found, bias this phi.  */
 300   for (i = 0; i < gimple_phi_num_args (stmt); i++)
 301     {
 302       tree arg = gimple_phi_arg_def (stmt, i);
 303       if (TREE_CODE (arg) == SSA_NAME
 304           && !SSA_NAME_IS_DEFAULT_DEF (arg))
 305         {
 306           gimple *def_stmt = SSA_NAME_DEF_STMT (arg);
 307           if (gimple_bb (def_stmt)->loop_father == father)
 308             return bb_rank[father->latch->index] + PHI_LOOP_BIAS;
 309         }
 310     }
 311
 312   /* Must be an uninteresting phi.  */
 313   return bb_rank[bb->index];
 314 }
 315
 316 /* If EXP is an SSA_NAME defined by a PHI statement that represents a
 317    loop-carried dependence of an innermost loop, return TRUE; else
 318    return FALSE.  */
 319 static bool
 320 loop_carried_phi (tree exp)
 321 {
 322   gimple *phi_stmt;
 323   long block_rank;
 324
 325   if (TREE_CODE (exp) != SSA_NAME
 326       || SSA_NAME_IS_DEFAULT_DEF (exp))
 327     return false;
 328
 329   phi_stmt = SSA_NAME_DEF_STMT (exp);
 330
 331   if (gimple_code (SSA_NAME_DEF_STMT (exp)) != GIMPLE_PHI)
 332     return false;
 333
 334   /* Non-loop-carried phis have block rank.  Loop-carried phis have
 335      an additional bias added in.  If this phi doesn't have block rank,
 336      it's biased and should not be propagated.  */
 337   block_rank = bb_rank[gimple_bb (phi_stmt)->index];
 338
 339   if (phi_rank (phi_stmt) != block_rank)
 340     return true;
 341
 342   return false;
 343 }
 344
 345 /* Return the maximum of RANK and the rank that should be propagated
 346    from expression OP.  For most operands, this is just the rank of OP.
 347    For loop-carried phis, the value is zero to avoid undoing the bias
 348    in favor of the phi.  */
 349 static long
 350 propagate_rank (long rank, tree op)
 351 {
 352   long op_rank;
 353
 354   if (loop_carried_phi (op))
 355     return rank;
 356
 357   op_rank = get_rank (op);
 358
 359   return MAX (rank, op_rank);
 360 }
 361
 362 /* Look up the operand rank structure for expression E.  */
 363
 364 static inline long
 365 find_operand_rank (tree e)
 366 {
 367   long *slot = operand_rank->get (e);
 368   return slot ? *slot : -1;
 369 }
 370
 371 /* Insert {E,RANK} into the operand rank hashtable.  */
 372
 373 static inline void
 374 insert_operand_rank (tree e, long rank)
 375 {
 376   gcc_assert (rank > 0);
 377   gcc_assert (!operand_rank->put (e, rank));
 378 }
 379
 380 /* Given an expression E, return the rank of the expression.  */
 381
 382 static long
 383 get_rank (tree e)
 384 {
 385   /* SSA_NAME's have the rank of the expression they are the result
 386      of.
 387      For globals and uninitialized values, the rank is 0.
 388      For function arguments, use the pre-setup rank.
 389      For PHI nodes, stores, asm statements, etc, we use the rank of
 390      the BB.
 391      For simple operations, the rank is the maximum rank of any of
 392      its operands, or the bb_rank, whichever is less.
 393      I make no claims that this is optimal, however, it gives good
 394      results.  */
 395
 396   /* We make an exception to the normal ranking system to break
 397      dependences of accumulator variables in loops.  Suppose we
 398      have a simple one-block loop containing:
 399
 400        x_1 = phi(x_0, x_2)
 401        b = a + x_1
 402        c = b + d
 403        x_2 = c + e
 404
 405      As shown, each iteration of the calculation into x is fully
 406      dependent upon the iteration before it.  We would prefer to
 407      see this in the form:
 408
 409        x_1 = phi(x_0, x_2)
 410        b = a + d
 411        c = b + e
 412        x_2 = c + x_1
 413
 414      If the loop is unrolled, the calculations of b and c from
 415      different iterations can be interleaved.
 416
 417      To obtain this result during reassociation, we bias the rank
 418      of the phi definition x_1 upward, when it is recognized as an
 419      accumulator pattern.  The artificial rank causes it to be
 420      added last, providing the desired independence.  */
 421
 422   if (TREE_CODE (e) == SSA_NAME)
 423     {
 424       ssa_op_iter iter;
 425       gimple *stmt;
 426       long rank;
 427       tree op;
 428
 429       if (SSA_NAME_IS_DEFAULT_DEF (e))
 430         return find_operand_rank (e);
 431
 432       stmt = SSA_NAME_DEF_STMT (e);
 433       if (gimple_code (stmt) == GIMPLE_PHI)
 434         return phi_rank (stmt);
 435
 436       if (!is_gimple_assign (stmt))
 437         return bb_rank[gimple_bb (stmt)->index];
 438
 439       /* If we already have a rank for this expression, use that.  */
 440       rank = find_operand_rank (e);
 441       if (rank != -1)
 442         return rank;
 443
 444       /* Otherwise, find the maximum rank for the operands.  As an
 445          exception, remove the bias from loop-carried phis when propagating
 446          the rank so that dependent operations are not also biased.  */
 447       /* Simply walk over all SSA uses - this takes advatage of the
 448          fact that non-SSA operands are is_gimple_min_invariant and
 449          thus have rank 0.  */
 450       rank = 0;
 451       FOR_EACH_SSA_TREE_OPERAND (op, stmt, iter, SSA_OP_USE)
 452         rank = propagate_rank (rank, op);
 453
 454       if (dump_file && (dump_flags & TDF_DETAILS))
 455         {
 456           fprintf (dump_file, "Rank for ");
 457           print_generic_expr (dump_file, e);
 458           fprintf (dump_file, " is %ld\n", (rank + 1));
 459         }
 460
 461       /* Note the rank in the hashtable so we don't recompute it.  */
 462       insert_operand_rank (e, (rank + 1));
 463       return (rank + 1);
 464     }
 465
 466   /* Constants, globals, etc., are rank 0 */
 467   return 0;
 468 }
 469
 470
 471 /* We want integer ones to end up last no matter what, since they are
 472    the ones we can do the most with.  */
 473 #define INTEGER_CONST_TYPE 1 << 3
 474 #define FLOAT_CONST_TYPE 1 << 2
 475 #define OTHER_CONST_TYPE 1 << 1
 476
 477 /* Classify an invariant tree into integer, float, or other, so that
 478    we can sort them to be near other constants of the same type.  */
 479 static inline int
 480 constant_type (tree t)
 481 {
 482   if (INTEGRAL_TYPE_P (TREE_TYPE (t)))
 483     return INTEGER_CONST_TYPE;
 484   else if (SCALAR_FLOAT_TYPE_P (TREE_TYPE (t)))
 485     return FLOAT_CONST_TYPE;
 486   else
 487     return OTHER_CONST_TYPE;
 488 }
 489
 490 /* qsort comparison function to sort operand entries PA and PB by rank
 491    so that the sorted array is ordered by rank in decreasing order.  */
 492 static int
 493 sort_by_operand_rank (const void *pa, const void *pb)
 494 {
 495   const operand_entry *oea = *(const operand_entry *const *)pa;
 496   const operand_entry *oeb = *(const operand_entry *const *)pb;
 497
 498   /* It's nicer for optimize_expression if constants that are likely
 499      to fold when added/multiplied//whatever are put next to each
 500      other.  Since all constants have rank 0, order them by type.  */
 501   if (oeb->rank == 0 && oea->rank == 0)
 502     {
 503       if (constant_type (oeb->op) != constant_type (oea->op))
 504         return constant_type (oeb->op) - constant_type (oea->op);
 505       else
 506         /* To make sorting result stable, we use unique IDs to determine
 507            order.  */
 508         return oeb->id > oea->id ? 1 : -1;
 509     }
 510
 511   /* Lastly, make sure the versions that are the same go next to each
 512      other.  */
 513   if (oeb->rank == oea->rank
 514       && TREE_CODE (oea->op) == SSA_NAME
 515       && TREE_CODE (oeb->op) == SSA_NAME)
 516     {
 517       /* As SSA_NAME_VERSION is assigned pretty randomly, because we reuse
 518          versions of removed SSA_NAMEs, so if possible, prefer to sort
 519          based on basic block and gimple_uid of the SSA_NAME_DEF_STMT.
 520          See PR60418.  */
 521       if (!SSA_NAME_IS_DEFAULT_DEF (oea->op)
 522           && !SSA_NAME_IS_DEFAULT_DEF (oeb->op)
 523           && !oea->stmt_to_insert
 524           && !oeb->stmt_to_insert
 525           && SSA_NAME_VERSION (oeb->op) != SSA_NAME_VERSION (oea->op))
 526         {
 527           gimple *stmta = SSA_NAME_DEF_STMT (oea->op);
 528           gimple *stmtb = SSA_NAME_DEF_STMT (oeb->op);
 529           basic_block bba = gimple_bb (stmta);
 530           basic_block bbb = gimple_bb (stmtb);
 531           if (bbb != bba)
 532             {
 533               if (bb_rank[bbb->index] != bb_rank[bba->index])
 534                 return bb_rank[bbb->index] - bb_rank[bba->index];
 535             }
 536           else
 537             {
 538               bool da = reassoc_stmt_dominates_stmt_p (stmta, stmtb);
 539               bool db = reassoc_stmt_dominates_stmt_p (stmtb, stmta);
 540               if (da != db)
 541                 return da ? 1 : -1;
 542             }
 543         }
 544
 545       if (SSA_NAME_VERSION (oeb->op) != SSA_NAME_VERSION (oea->op))
 546         return SSA_NAME_VERSION (oeb->op) > SSA_NAME_VERSION (oea->op) ? 1 : -1;
 547       else
 548         return oeb->id > oea->id ? 1 : -1;
 549     }
 550
 551   if (oeb->rank != oea->rank)
 552     return oeb->rank > oea->rank ? 1 : -1;
 553   else
 554     return oeb->id > oea->id ? 1 : -1;
 555 }
 556
 557 /* Add an operand entry to *OPS for the tree operand OP.  */
 558
 559 static void
 560 add_to_ops_vec (vec<operand_entry *> *ops, tree op, gimple *stmt_to_insert = NULL)
 561 {
 562   operand_entry *oe = operand_entry_pool.allocate ();
 563
 564   oe->op = op;
 565   oe->rank = get_rank (op);
 566   oe->id = next_operand_entry_id++;
 567   oe->count = 1;
 568   oe->stmt_to_insert = stmt_to_insert;
 569   ops->safe_push (oe);
 570 }
 571
 572 /* Add an operand entry to *OPS for the tree operand OP with repeat
 573    count REPEAT.  */
 574
 575 static void
 576 add_repeat_to_ops_vec (vec<operand_entry *> *ops, tree op,
 577                        HOST_WIDE_INT repeat)
 578 {
 579   operand_entry *oe = operand_entry_pool.allocate ();
 580
 581   oe->op = op;
 582   oe->rank = get_rank (op);
 583   oe->id = next_operand_entry_id++;
 584   oe->count = repeat;
 585   oe->stmt_to_insert = NULL;
 586   ops->safe_push (oe);
 587
 588   reassociate_stats.pows_encountered++;
 589 }
 590
 591 /* Return true if STMT is reassociable operation containing a binary
 592    operation with tree code CODE, and is inside LOOP.  */
 593
 594 static bool
 595 is_reassociable_op (gimple *stmt, enum tree_code code, struct loop *loop)
 596 {
 597   basic_block bb = gimple_bb (stmt);
 598
 599   if (gimple_bb (stmt) == NULL)
 600     return false;
 601
 602   if (!flow_bb_inside_loop_p (loop, bb))
 603     return false;
 604
 605   if (is_gimple_assign (stmt)
 606       && gimple_assign_rhs_code (stmt) == code
 607       && has_single_use (gimple_assign_lhs (stmt)))
 608     {
 609       tree rhs1 = gimple_assign_rhs1 (stmt);
 610       tree rhs2 = gimple_assign_rhs1 (stmt);
 611       if (TREE_CODE (rhs1) == SSA_NAME
 612           && SSA_NAME_OCCURS_IN_ABNORMAL_PHI (rhs1))
 613         return false;
 614       if (rhs2
 615           && TREE_CODE (rhs2) == SSA_NAME
 616           && SSA_NAME_OCCURS_IN_ABNORMAL_PHI (rhs2))
 617         return false;
 618       return true;
 619     }
 620
 621   return false;
 622 }
 623
 624
 625 /* Return true if STMT is a nop-conversion.  */
 626
 627 static bool
 628 gimple_nop_conversion_p (gimple *stmt)
 629 {
 630   if (gassign *ass = dyn_cast <gassign *> (stmt))
 631     {
 632       if (CONVERT_EXPR_CODE_P (gimple_assign_rhs_code (ass))
 633           && tree_nop_conversion_p (TREE_TYPE (gimple_assign_lhs (ass)),
 634                                     TREE_TYPE (gimple_assign_rhs1 (ass))))
 635         return true;
 636     }
 637   return false;
 638 }
 639
 640 /* Given NAME, if NAME is defined by a unary operation OPCODE, return the
 641    operand of the negate operation.  Otherwise, return NULL.  */
 642
 643 static tree
 644 get_unary_op (tree name, enum tree_code opcode)
 645 {
 646   gimple *stmt = SSA_NAME_DEF_STMT (name);
 647
 648   /* Look through nop conversions (sign changes).  */
 649   if (gimple_nop_conversion_p (stmt)
 650       && TREE_CODE (gimple_assign_rhs1 (stmt)) == SSA_NAME)
 651     stmt = SSA_NAME_DEF_STMT (gimple_assign_rhs1 (stmt));
 652
 653   if (!is_gimple_assign (stmt))
 654     return NULL_TREE;
 655
 656   if (gimple_assign_rhs_code (stmt) == opcode)
 657     return gimple_assign_rhs1 (stmt);
 658   return NULL_TREE;
 659 }
 660
 661 /* Return true if OP1 and OP2 have the same value if casted to either type.  */
 662
 663 static bool
 664 ops_equal_values_p (tree op1, tree op2)
 665 {
 666   if (op1 == op2)
 667     return true;
 668
 669   tree orig_op1 = op1;
 670   if (TREE_CODE (op1) == SSA_NAME)
 671     {
 672       gimple *stmt = SSA_NAME_DEF_STMT (op1);
 673       if (gimple_nop_conversion_p (stmt))
 674         {
 675           op1 = gimple_assign_rhs1 (stmt);
 676           if (op1 == op2)
 677             return true;
 678         }
 679     }
 680
 681   if (TREE_CODE (op2) == SSA_NAME)
 682     {
 683       gimple *stmt = SSA_NAME_DEF_STMT (op2);
 684       if (gimple_nop_conversion_p (stmt))
 685         {
 686           op2 = gimple_assign_rhs1 (stmt);
 687           if (op1 == op2
 688               || orig_op1 == op2)
 689             return true;
 690         }
 691     }
 692
 693   return false;
 694 }
 695
 696
 697 /* If CURR and LAST are a pair of ops that OPCODE allows us to
 698    eliminate through equivalences, do so, remove them from OPS, and
 699    return true.  Otherwise, return false.  */
 700
 701 static bool
 702 eliminate_duplicate_pair (enum tree_code opcode,
 703                           vec<operand_entry *> *ops,
 704                           bool *all_done,
 705                           unsigned int i,
 706                           operand_entry *curr,
 707                           operand_entry *last)
 708 {
 709
 710   /* If we have two of the same op, and the opcode is & |, min, or max,
 711      we can eliminate one of them.
 712      If we have two of the same op, and the opcode is ^, we can
 713      eliminate both of them.  */
 714
 715   if (last && last->op == curr->op)
 716     {
 717       switch (opcode)
 718         {
 719         case MAX_EXPR:
 720         case MIN_EXPR:
 721         case BIT_IOR_EXPR:
 722         case BIT_AND_EXPR:
 723           if (dump_file && (dump_flags & TDF_DETAILS))
 724             {
 725               fprintf (dump_file, "Equivalence: ");
 726               print_generic_expr (dump_file, curr->op);
 727               fprintf (dump_file, " [&|minmax] ");
 728               print_generic_expr (dump_file, last->op);
 729               fprintf (dump_file, " -> ");
 730               print_generic_stmt (dump_file, last->op);
 731             }
 732
 733           ops->ordered_remove (i);
 734           reassociate_stats.ops_eliminated ++;
 735
 736           return true;
 737
 738         case BIT_XOR_EXPR:
 739           if (dump_file && (dump_flags & TDF_DETAILS))
 740             {
 741               fprintf (dump_file, "Equivalence: ");
 742               print_generic_expr (dump_file, curr->op);
 743               fprintf (dump_file, " ^ ");
 744               print_generic_expr (dump_file, last->op);
 745               fprintf (dump_file, " -> nothing\n");
 746             }
 747
 748           reassociate_stats.ops_eliminated += 2;
 749
 750           if (ops->length () == 2)
 751             {
 752               ops->truncate (0);
 753               add_to_ops_vec (ops, build_zero_cst (TREE_TYPE (last->op)));
 754               *all_done = true;
 755             }
 756           else
 757             {
 758               ops->ordered_remove (i-1);
 759               ops->ordered_remove (i-1);
 760             }
 761
 762           return true;
 763
 764         default:
 765           break;
 766         }
 767     }
 768   return false;
 769 }
 770
 771 static vec<tree> plus_negates;
 772
 773 /* If OPCODE is PLUS_EXPR, CURR->OP is a negate expression or a bitwise not
 774    expression, look in OPS for a corresponding positive operation to cancel
 775    it out.  If we find one, remove the other from OPS, replace
 776    OPS[CURRINDEX] with 0 or -1, respectively, and return true.  Otherwise,
 777    return false. */
 778
 779 static bool
 780 eliminate_plus_minus_pair (enum tree_code opcode,
 781                            vec<operand_entry *> *ops,
 782                            unsigned int currindex,
 783                            operand_entry *curr)
 784 {
 785   tree negateop;
 786   tree notop;
 787   unsigned int i;
 788   operand_entry *oe;
 789
 790   if (opcode != PLUS_EXPR || TREE_CODE (curr->op) != SSA_NAME)
 791     return false;
 792
 793   negateop = get_unary_op (curr->op, NEGATE_EXPR);
 794   notop = get_unary_op (curr->op, BIT_NOT_EXPR);
 795   if (negateop == NULL_TREE && notop == NULL_TREE)
 796     return false;
 797
 798   /* Any non-negated version will have a rank that is one less than
 799      the current rank.  So once we hit those ranks, if we don't find
 800      one, we can stop.  */
 801
 802   for (i = currindex + 1;
 803        ops->iterate (i, &oe)
 804        && oe->rank >= curr->rank - 1 ;
 805        i++)
 806     {
 807       if (negateop
 808           && ops_equal_values_p (oe->op, negateop))
 809         {
 810           if (dump_file && (dump_flags & TDF_DETAILS))
 811             {
 812               fprintf (dump_file, "Equivalence: ");
 813               print_generic_expr (dump_file, negateop);
 814               fprintf (dump_file, " + -");
 815               print_generic_expr (dump_file, oe->op);
 816               fprintf (dump_file, " -> 0\n");
 817             }
 818
 819           ops->ordered_remove (i);
 820           add_to_ops_vec (ops, build_zero_cst (TREE_TYPE (oe->op)));
 821           ops->ordered_remove (currindex);
 822           reassociate_stats.ops_eliminated ++;
 823
 824           return true;
 825         }
 826       else if (notop
 827                && ops_equal_values_p (oe->op, notop))
 828         {
 829           tree op_type = TREE_TYPE (oe->op);
 830
 831           if (dump_file && (dump_flags & TDF_DETAILS))
 832             {
 833               fprintf (dump_file, "Equivalence: ");
 834               print_generic_expr (dump_file, notop);
 835               fprintf (dump_file, " + ~");
 836               print_generic_expr (dump_file, oe->op);
 837               fprintf (dump_file, " -> -1\n");
 838             }
 839
 840           ops->ordered_remove (i);
 841           add_to_ops_vec (ops, build_all_ones_cst (op_type));
 842           ops->ordered_remove (currindex);
 843           reassociate_stats.ops_eliminated ++;
 844
 845           return true;
 846         }
 847     }
 848
 849   /* If CURR->OP is a negate expr without nop conversion in a plus expr:
 850      save it for later inspection in repropagate_negates().  */
 851   if (negateop != NULL_TREE
 852       && gimple_assign_rhs_code (SSA_NAME_DEF_STMT (curr->op)) == NEGATE_EXPR)
 853     plus_negates.safe_push (curr->op);
 854
 855   return false;
 856 }
 857
 858 /* If OPCODE is BIT_IOR_EXPR, BIT_AND_EXPR, and, CURR->OP is really a
 859    bitwise not expression, look in OPS for a corresponding operand to
 860    cancel it out.  If we find one, remove the other from OPS, replace
 861    OPS[CURRINDEX] with 0, and return true.  Otherwise, return
 862    false. */
 863
 864 static bool
 865 eliminate_not_pairs (enum tree_code opcode,
 866                      vec<operand_entry *> *ops,
 867                      unsigned int currindex,
 868                      operand_entry *curr)
 869 {
 870   tree notop;
 871   unsigned int i;
 872   operand_entry *oe;
 873
 874   if ((opcode != BIT_IOR_EXPR && opcode != BIT_AND_EXPR)
 875       || TREE_CODE (curr->op) != SSA_NAME)
 876     return false;
 877
 878   notop = get_unary_op (curr->op, BIT_NOT_EXPR);
 879   if (notop == NULL_TREE)
 880     return false;
 881
 882   /* Any non-not version will have a rank that is one less than
 883      the current rank.  So once we hit those ranks, if we don't find
 884      one, we can stop.  */
 885
 886   for (i = currindex + 1;
 887        ops->iterate (i, &oe)
 888        && oe->rank >= curr->rank - 1;
 889        i++)
 890     {
 891       if (oe->op == notop)
 892         {
 893           if (dump_file && (dump_flags & TDF_DETAILS))
 894             {
 895               fprintf (dump_file, "Equivalence: ");
 896               print_generic_expr (dump_file, notop);
 897               if (opcode == BIT_AND_EXPR)
 898                 fprintf (dump_file, " & ~");
 899               else if (opcode == BIT_IOR_EXPR)
 900                 fprintf (dump_file, " | ~");
 901               print_generic_expr (dump_file, oe->op);
 902               if (opcode == BIT_AND_EXPR)
 903                 fprintf (dump_file, " -> 0\n");
 904               else if (opcode == BIT_IOR_EXPR)
 905                 fprintf (dump_file, " -> -1\n");
 906             }
 907
 908           if (opcode == BIT_AND_EXPR)
 909             oe->op = build_zero_cst (TREE_TYPE (oe->op));
 910           else if (opcode == BIT_IOR_EXPR)
 911             oe->op = build_all_ones_cst (TREE_TYPE (oe->op));
 912
 913           reassociate_stats.ops_eliminated += ops->length () - 1;
 914           ops->truncate (0);
 915           ops->quick_push (oe);
 916           return true;
 917         }
 918     }
 919
 920   return false;
 921 }
 922
 923 /* Use constant value that may be present in OPS to try to eliminate
 924    operands.  Note that this function is only really used when we've
 925    eliminated ops for other reasons, or merged constants.  Across
 926    single statements, fold already does all of this, plus more.  There
 927    is little point in duplicating logic, so I've only included the
 928    identities that I could ever construct testcases to trigger.  */
 929
 930 static void
 931 eliminate_using_constants (enum tree_code opcode,
 932                            vec<operand_entry *> *ops)
 933 {
 934   operand_entry *oelast = ops->last ();
 935   tree type = TREE_TYPE (oelast->op);
 936
 937   if (oelast->rank == 0
 938       && (ANY_INTEGRAL_TYPE_P (type) || FLOAT_TYPE_P (type)))
 939     {
 940       switch (opcode)
 941         {
 942         case BIT_AND_EXPR:
 943           if (integer_zerop (oelast->op))
 944             {
 945               if (ops->length () != 1)
 946                 {
 947                   if (dump_file && (dump_flags & TDF_DETAILS))
 948                     fprintf (dump_file, "Found & 0, removing all other ops\n");
 949
 950                   reassociate_stats.ops_eliminated += ops->length () - 1;
 951
 952                   ops->truncate (0);
 953                   ops->quick_push (oelast);
 954                   return;
 955                 }
 956             }
 957           else if (integer_all_onesp (oelast->op))
 958             {
 959               if (ops->length () != 1)
 960                 {
 961                   if (dump_file && (dump_flags & TDF_DETAILS))
 962                     fprintf (dump_file, "Found & -1, removing\n");
 963                   ops->pop ();
 964                   reassociate_stats.ops_eliminated++;
 965                 }
 966             }
 967           break;
 968         case BIT_IOR_EXPR:
 969           if (integer_all_onesp (oelast->op))
 970             {
 971               if (ops->length () != 1)
 972                 {
 973                   if (dump_file && (dump_flags & TDF_DETAILS))
 974                     fprintf (dump_file, "Found | -1, removing all other ops\n");
 975
 976                   reassociate_stats.ops_eliminated += ops->length () - 1;
 977
 978                   ops->truncate (0);
 979                   ops->quick_push (oelast);
 980                   return;
 981                 }
 982             }
 983           else if (integer_zerop (oelast->op))
 984             {
 985               if (ops->length () != 1)
 986                 {
 987                   if (dump_file && (dump_flags & TDF_DETAILS))
 988                     fprintf (dump_file, "Found | 0, removing\n");
 989                   ops->pop ();
 990                   reassociate_stats.ops_eliminated++;
 991                 }
 992             }
 993           break;
 994         case MULT_EXPR:
 995           if (integer_zerop (oelast->op)
 996               || (FLOAT_TYPE_P (type)
 997                   && !HONOR_NANS (type)
 998                   && !HONOR_SIGNED_ZEROS (type)
 999                   && real_zerop (oelast->op)))
1000             {
1001               if (ops->length () != 1)
1002                 {
1003                   if (dump_file && (dump_flags & TDF_DETAILS))
1004                     fprintf (dump_file, "Found * 0, removing all other ops\n");
1005
1006                   reassociate_stats.ops_eliminated += ops->length () - 1;
1007                   ops->truncate (1);
1008                   ops->quick_push (oelast);
1009                   return;
1010                 }
1011             }
1012           else if (integer_onep (oelast->op)
1013                    || (FLOAT_TYPE_P (type)
1014                        && !HONOR_SNANS (type)
1015                        && real_onep (oelast->op)))
1016             {
1017               if (ops->length () != 1)
1018                 {
1019                   if (dump_file && (dump_flags & TDF_DETAILS))
1020                     fprintf (dump_file, "Found * 1, removing\n");
1021                   ops->pop ();
1022                   reassociate_stats.ops_eliminated++;
1023                   return;
1024                 }
1025             }
1026           break;
1027         case BIT_XOR_EXPR:
1028         case PLUS_EXPR:
1029         case MINUS_EXPR:
1030           if (integer_zerop (oelast->op)
1031               || (FLOAT_TYPE_P (type)
1032                   && (opcode == PLUS_EXPR || opcode == MINUS_EXPR)
1033                   && fold_real_zero_addition_p (type, oelast->op,
1034                                                 opcode == MINUS_EXPR)))
1035             {
1036               if (ops->length () != 1)
1037                 {
1038                   if (dump_file && (dump_flags & TDF_DETAILS))
1039                     fprintf (dump_file, "Found [|^+] 0, removing\n");
1040                   ops->pop ();
1041                   reassociate_stats.ops_eliminated++;
1042                   return;
1043                 }
1044             }
1045           break;
1046         default:
1047           break;
1048         }
1049     }
1050 }
1051
1052
1053 static void linearize_expr_tree (vec<operand_entry *> *, gimple *,
1054                                  bool, bool);
1055
1056 /* Structure for tracking and counting operands.  */
1057 struct oecount {
1058   unsigned int cnt;
1059   unsigned int id;
1060   enum tree_code oecode;
1061   tree op;
1062 };
1063
1064
1065 /* The heap for the oecount hashtable and the sorted list of operands.  */
1066 static vec<oecount> cvec;
1067
1068
1069 /* Oecount hashtable helpers.  */
1070
1071 struct oecount_hasher : int_hash <int, 0, 1>
1072 {
1073   static inline hashval_t hash (int);
1074   static inline bool equal (int, int);
1075 };
1076
1077 /* Hash function for oecount.  */
1078
1079 inline hashval_t
1080 oecount_hasher::hash (int p)
1081 {
1082   const oecount *c = &cvec[p - 42];
1083   return htab_hash_pointer (c->op) ^ (hashval_t)c->oecode;
1084 }
1085
1086 /* Comparison function for oecount.  */
1087
1088 inline bool
1089 oecount_hasher::equal (int p1, int p2)
1090 {
1091   const oecount *c1 = &cvec[p1 - 42];
1092   const oecount *c2 = &cvec[p2 - 42];
1093   return c1->oecode == c2->oecode && c1->op == c2->op;
1094 }
1095
1096 /* Comparison function for qsort sorting oecount elements by count.  */
1097
1098 static int
1099 oecount_cmp (const void *p1, const void *p2)
1100 {
1101   const oecount *c1 = (const oecount *)p1;
1102   const oecount *c2 = (const oecount *)p2;
1103   if (c1->cnt != c2->cnt)
1104     return c1->cnt > c2->cnt ? 1 : -1;
1105   else
1106     /* If counts are identical, use unique IDs to stabilize qsort.  */
1107     return c1->id > c2->id ? 1 : -1;
1108 }
1109
1110 /* Return TRUE iff STMT represents a builtin call that raises OP
1111    to some exponent.  */
1112
1113 static bool
1114 stmt_is_power_of_op (gimple *stmt, tree op)
1115 {
1116   if (!is_gimple_call (stmt))
1117     return false;
1118
1119   switch (gimple_call_combined_fn (stmt))
1120     {
1121     CASE_CFN_POW:
1122     CASE_CFN_POWI:
1123       return (operand_equal_p (gimple_call_arg (stmt, 0), op, 0));
1124
1125     default:
1126       return false;
1127     }
1128 }
1129
1130 /* Given STMT which is a __builtin_pow* call, decrement its exponent
1131    in place and return the result.  Assumes that stmt_is_power_of_op
1132    was previously called for STMT and returned TRUE.  */
1133
1134 static HOST_WIDE_INT
1135 decrement_power (gimple *stmt)
1136 {
1137   REAL_VALUE_TYPE c, cint;
1138   HOST_WIDE_INT power;
1139   tree arg1;
1140
1141   switch (gimple_call_combined_fn (stmt))
1142     {
1143     CASE_CFN_POW:
1144       arg1 = gimple_call_arg (stmt, 1);
1145       c = TREE_REAL_CST (arg1);
1146       power = real_to_integer (&c) - 1;
1147       real_from_integer (&cint, VOIDmode, power, SIGNED);
1148       gimple_call_set_arg (stmt, 1, build_real (TREE_TYPE (arg1), cint));
1149       return power;
1150
1151     CASE_CFN_POWI:
1152       arg1 = gimple_call_arg (stmt, 1);
1153       power = TREE_INT_CST_LOW (arg1) - 1;
1154       gimple_call_set_arg (stmt, 1, build_int_cst (TREE_TYPE (arg1), power));
1155       return power;
1156
1157     default:
1158       gcc_unreachable ();
1159     }
1160 }
1161
1162 /* Replace SSA defined by STMT and replace all its uses with new
1163    SSA.  Also return the new SSA.  */
1164
1165 static tree
1166 make_new_ssa_for_def (gimple *stmt, enum tree_code opcode, tree op)
1167 {
1168   gimple *use_stmt;
1169   use_operand_p use;
1170   imm_use_iterator iter;
1171   tree new_lhs, new_debug_lhs = NULL_TREE;
1172   tree lhs = gimple_get_lhs (stmt);
1173
1174   new_lhs = make_ssa_name (TREE_TYPE (lhs));
1175   gimple_set_lhs (stmt, new_lhs);
1176
1177   /* Also need to update GIMPLE_DEBUGs.  */
1178   FOR_EACH_IMM_USE_STMT (use_stmt, iter, lhs)
1179     {
1180       tree repl = new_lhs;
1181       if (is_gimple_debug (use_stmt))
1182         {
1183           if (new_debug_lhs == NULL_TREE)
1184             {
1185               new_debug_lhs = make_node (DEBUG_EXPR_DECL);
1186               gdebug *def_temp
1187                 = gimple_build_debug_bind (new_debug_lhs,
1188                                            build2 (opcode, TREE_TYPE (lhs),
1189                                                    new_lhs, op),
1190                                            stmt);
1191               DECL_ARTIFICIAL (new_debug_lhs) = 1;
1192               TREE_TYPE (new_debug_lhs) = TREE_TYPE (lhs);
1193               SET_DECL_MODE (new_debug_lhs, TYPE_MODE (TREE_TYPE (lhs)));
1194               gimple_set_uid (def_temp, gimple_uid (stmt));
1195               gimple_stmt_iterator gsi = gsi_for_stmt (stmt);
1196               gsi_insert_after (&gsi, def_temp, GSI_SAME_STMT);
1197             }
1198           repl = new_debug_lhs;
1199         }
1200       FOR_EACH_IMM_USE_ON_STMT (use, iter)
1201         SET_USE (use, repl);
1202       update_stmt (use_stmt);
1203     }
1204   return new_lhs;
1205 }
1206
1207 /* Replace all SSAs defined in STMTS_TO_FIX and replace its
1208    uses with new SSAs.  Also do this for the stmt that defines DEF
1209    if *DEF is not OP.  */
1210
1211 static void
1212 make_new_ssa_for_all_defs (tree *def, enum tree_code opcode, tree op,
1213                            vec<gimple *> &stmts_to_fix)
1214 {
1215   unsigned i;
1216   gimple *stmt;
1217
1218   if (*def != op
1219       && TREE_CODE (*def) == SSA_NAME
1220       && (stmt = SSA_NAME_DEF_STMT (*def))
1221       && gimple_code (stmt) != GIMPLE_NOP)
1222     *def = make_new_ssa_for_def (stmt, opcode, op);
1223
1224   FOR_EACH_VEC_ELT (stmts_to_fix, i, stmt)
1225     make_new_ssa_for_def (stmt, opcode, op);
1226 }
1227
1228 /* Find the single immediate use of STMT's LHS, and replace it
1229    with OP.  Remove STMT.  If STMT's LHS is the same as *DEF,
1230    replace *DEF with OP as well.  */
1231
1232 static void
1233 propagate_op_to_single_use (tree op, gimple *stmt, tree *def)
1234 {
1235   tree lhs;
1236   gimple *use_stmt;
1237   use_operand_p use;
1238   gimple_stmt_iterator gsi;
1239
1240   if (is_gimple_call (stmt))
1241     lhs = gimple_call_lhs (stmt);
1242   else
1243     lhs = gimple_assign_lhs (stmt);
1244
1245   gcc_assert (has_single_use (lhs));
1246   single_imm_use (lhs, &use, &use_stmt);
1247   if (lhs == *def)
1248     *def = op;
1249   SET_USE (use, op);
1250   if (TREE_CODE (op) != SSA_NAME)
1251     update_stmt (use_stmt);
1252   gsi = gsi_for_stmt (stmt);
1253   unlink_stmt_vdef (stmt);
1254   reassoc_remove_stmt (&gsi);
1255   release_defs (stmt);
1256 }
1257
1258 /* Walks the linear chain with result *DEF searching for an operation
1259    with operand OP and code OPCODE removing that from the chain.  *DEF
1260    is updated if there is only one operand but no operation left.  */
1261
1262 static void
1263 zero_one_operation (tree *def, enum tree_code opcode, tree op)
1264 {
1265   tree orig_def = *def;
1266   gimple *stmt = SSA_NAME_DEF_STMT (*def);
1267   /* PR72835 - Record the stmt chain that has to be updated such that
1268      we dont use the same LHS when the values computed are different.  */
1269   auto_vec<gimple *, 64> stmts_to_fix;
1270
1271   do
1272     {
1273       tree name;
1274
1275       if (opcode == MULT_EXPR)
1276         {
1277           if (stmt_is_power_of_op (stmt, op))
1278             {
1279               if (decrement_power (stmt) == 1)
1280                 {
1281                   if (stmts_to_fix.length () > 0)
1282                     stmts_to_fix.pop ();
1283                   propagate_op_to_single_use (op, stmt, def);
1284                 }
1285               break;
1286             }
1287           else if (gimple_assign_rhs_code (stmt) == NEGATE_EXPR)
1288             {
1289               if (gimple_assign_rhs1 (stmt) == op)
1290                 {
1291                   tree cst = build_minus_one_cst (TREE_TYPE (op));
1292                   if (stmts_to_fix.length () > 0)
1293                     stmts_to_fix.pop ();
1294                   propagate_op_to_single_use (cst, stmt, def);
1295                   break;
1296                 }
1297               else if (integer_minus_onep (op)
1298                        || real_minus_onep (op))
1299                 {
1300                   gimple_assign_set_rhs_code
1301                     (stmt, TREE_CODE (gimple_assign_rhs1 (stmt)));
1302                   break;
1303                 }
1304             }
1305         }
1306
1307       name = gimple_assign_rhs1 (stmt);
1308
1309       /* If this is the operation we look for and one of the operands
1310          is ours simply propagate the other operand into the stmts
1311          single use.  */
1312       if (gimple_assign_rhs_code (stmt) == opcode
1313           && (name == op
1314               || gimple_assign_rhs2 (stmt) == op))
1315         {
1316           if (name == op)
1317             name = gimple_assign_rhs2 (stmt);
1318           if (stmts_to_fix.length () > 0)
1319             stmts_to_fix.pop ();
1320           propagate_op_to_single_use (name, stmt, def);
1321           break;
1322         }
1323
1324       /* We might have a multiply of two __builtin_pow* calls, and
1325          the operand might be hiding in the rightmost one.  Likewise
1326          this can happen for a negate.  */
1327       if (opcode == MULT_EXPR
1328           && gimple_assign_rhs_code (stmt) == opcode
1329           && TREE_CODE (gimple_assign_rhs2 (stmt)) == SSA_NAME
1330           && has_single_use (gimple_assign_rhs2 (stmt)))
1331         {
1332           gimple *stmt2 = SSA_NAME_DEF_STMT (gimple_assign_rhs2 (stmt));
1333           if (stmt_is_power_of_op (stmt2, op))
1334             {
1335               if (decrement_power (stmt2) == 1)
1336                 propagate_op_to_single_use (op, stmt2, def);
1337               else
1338                 stmts_to_fix.safe_push (stmt2);
1339               break;
1340             }
1341           else if (is_gimple_assign (stmt2)
1342                    && gimple_assign_rhs_code (stmt2) == NEGATE_EXPR)
1343             {
1344               if (gimple_assign_rhs1 (stmt2) == op)
1345                 {
1346                   tree cst = build_minus_one_cst (TREE_TYPE (op));
1347                   propagate_op_to_single_use (cst, stmt2, def);
1348                   break;
1349                 }
1350               else if (integer_minus_onep (op)
1351                        || real_minus_onep (op))
1352                 {
1353                   stmts_to_fix.safe_push (stmt2);
1354                   gimple_assign_set_rhs_code
1355                     (stmt2, TREE_CODE (gimple_assign_rhs1 (stmt2)));
1356                   break;
1357                 }
1358             }
1359         }
1360
1361       /* Continue walking the chain.  */
1362       gcc_assert (name != op
1363                   && TREE_CODE (name) == SSA_NAME);
1364       stmt = SSA_NAME_DEF_STMT (name);
1365       stmts_to_fix.safe_push (stmt);
1366     }
1367   while (1);
1368
1369   if (stmts_to_fix.length () > 0 || *def == orig_def)
1370     make_new_ssa_for_all_defs (def, opcode, op, stmts_to_fix);
1371 }
1372
1373 /* Returns true if statement S1 dominates statement S2.  Like
1374    stmt_dominates_stmt_p, but uses stmt UIDs to optimize.  */
1375
1376 static bool
1377 reassoc_stmt_dominates_stmt_p (gimple *s1, gimple *s2)
1378 {
1379   basic_block bb1 = gimple_bb (s1), bb2 = gimple_bb (s2);
1380
1381   /* If bb1 is NULL, it should be a GIMPLE_NOP def stmt of an (D)
1382      SSA_NAME.  Assume it lives at the beginning of function and
1383      thus dominates everything.  */
1384   if (!bb1 || s1 == s2)
1385     return true;
1386
1387   /* If bb2 is NULL, it doesn't dominate any stmt with a bb.  */
1388   if (!bb2)
1389     return false;
1390
1391   if (bb1 == bb2)
1392     {
1393       /* PHIs in the same basic block are assumed to be
1394          executed all in parallel, if only one stmt is a PHI,
1395          it dominates the other stmt in the same basic block.  */
1396       if (gimple_code (s1) == GIMPLE_PHI)
1397         return true;
1398
1399       if (gimple_code (s2) == GIMPLE_PHI)
1400         return false;
1401
1402       gcc_assert (gimple_uid (s1) && gimple_uid (s2));
1403
1404       if (gimple_uid (s1) < gimple_uid (s2))
1405         return true;
1406
1407       if (gimple_uid (s1) > gimple_uid (s2))
1408         return false;
1409
1410       gimple_stmt_iterator gsi = gsi_for_stmt (s1);
1411       unsigned int uid = gimple_uid (s1);
1412       for (gsi_next (&gsi); !gsi_end_p (gsi); gsi_next (&gsi))
1413         {
1414           gimple *s = gsi_stmt (gsi);
1415           if (gimple_uid (s) != uid)
1416             break;
1417           if (s == s2)
1418             return true;
1419         }
1420
1421       return false;
1422     }
1423
1424   return dominated_by_p (CDI_DOMINATORS, bb2, bb1);
1425 }
1426
1427 /* Insert STMT after INSERT_POINT.  */
1428
1429 static void
1430 insert_stmt_after (gimple *stmt, gimple *insert_point)
1431 {
1432   gimple_stmt_iterator gsi;
1433   basic_block bb;
1434
1435   if (gimple_code (insert_point) == GIMPLE_PHI)
1436     bb = gimple_bb (insert_point);
1437   else if (!stmt_ends_bb_p (insert_point))
1438     {
1439       gsi = gsi_for_stmt (insert_point);
1440       gimple_set_uid (stmt, gimple_uid (insert_point));
1441       gsi_insert_after (&gsi, stmt, GSI_NEW_STMT);
1442       return;
1443     }
1444   else
1445     /* We assume INSERT_POINT is a SSA_NAME_DEF_STMT of some SSA_NAME,
1446        thus if it must end a basic block, it should be a call that can
1447        throw, or some assignment that can throw.  If it throws, the LHS
1448        of it will not be initialized though, so only valid places using
1449        the SSA_NAME should be dominated by the fallthru edge.  */
1450     bb = find_fallthru_edge (gimple_bb (insert_point)->succs)->dest;
1451   gsi = gsi_after_labels (bb);
1452   if (gsi_end_p (gsi))
1453     {
1454       gimple_stmt_iterator gsi2 = gsi_last_bb (bb);
1455       gimple_set_uid (stmt,
1456                       gsi_end_p (gsi2) ? 1 : gimple_uid (gsi_stmt (gsi2)));
1457     }
1458   else
1459     gimple_set_uid (stmt, gimple_uid (gsi_stmt (gsi)));
1460   gsi_insert_before (&gsi, stmt, GSI_SAME_STMT);
1461 }
1462
1463 /* Builds one statement performing OP1 OPCODE OP2 using TMPVAR for
1464    the result.  Places the statement after the definition of either
1465    OP1 or OP2.  Returns the new statement.  */
1466
1467 static gimple *
1468 build_and_add_sum (tree type, tree op1, tree op2, enum tree_code opcode)
1469 {
1470   gimple *op1def = NULL, *op2def = NULL;
1471   gimple_stmt_iterator gsi;
1472   tree op;
1473   gassign *sum;
1474
1475   /* Create the addition statement.  */
1476   op = make_ssa_name (type);
1477   sum = gimple_build_assign (op, opcode, op1, op2);
1478
1479   /* Find an insertion place and insert.  */
1480   if (TREE_CODE (op1) == SSA_NAME)
1481     op1def = SSA_NAME_DEF_STMT (op1);
1482   if (TREE_CODE (op2) == SSA_NAME)
1483     op2def = SSA_NAME_DEF_STMT (op2);
1484   if ((!op1def || gimple_nop_p (op1def))
1485       && (!op2def || gimple_nop_p (op2def)))
1486     {
1487       gsi = gsi_after_labels (single_succ (ENTRY_BLOCK_PTR_FOR_FN (cfun)));
1488       if (gsi_end_p (gsi))
1489         {
1490           gimple_stmt_iterator gsi2
1491             = gsi_last_bb (single_succ (ENTRY_BLOCK_PTR_FOR_FN (cfun)));
1492           gimple_set_uid (sum,
1493                           gsi_end_p (gsi2) ? 1 : gimple_uid (gsi_stmt (gsi2)));
1494         }
1495       else
1496         gimple_set_uid (sum, gimple_uid (gsi_stmt (gsi)));
1497       gsi_insert_before (&gsi, sum, GSI_NEW_STMT);
1498     }
1499   else
1500     {
1501       gimple *insert_point;
1502       if ((!op1def || gimple_nop_p (op1def))
1503            || (op2def && !gimple_nop_p (op2def)
1504                && reassoc_stmt_dominates_stmt_p (op1def, op2def)))
1505         insert_point = op2def;
1506       else
1507         insert_point = op1def;
1508       insert_stmt_after (sum, insert_point);
1509     }
1510   update_stmt (sum);
1511
1512   return sum;
1513 }
1514
1515 /* Perform un-distribution of divisions and multiplications.
1516    A * X + B * X is transformed into (A + B) * X and A / X + B / X
1517    to (A + B) / X for real X.
1518
1519    The algorithm is organized as follows.
1520
1521     - First we walk the addition chain *OPS looking for summands that
1522       are defined by a multiplication or a real division.  This results
1523       in the candidates bitmap with relevant indices into *OPS.
1524
1525     - Second we build the chains of multiplications or divisions for
1526       these candidates, counting the number of occurrences of (operand, code)
1527       pairs in all of the candidates chains.
1528
1529     - Third we sort the (operand, code) pairs by number of occurrence and
1530       process them starting with the pair with the most uses.
1531
1532       * For each such pair we walk the candidates again to build a
1533         second candidate bitmap noting all multiplication/division chains
1534         that have at least one occurrence of (operand, code).
1535
1536       * We build an alternate addition chain only covering these
1537         candidates with one (operand, code) operation removed from their
1538         multiplication/division chain.
1539
1540       * The first candidate gets replaced by the alternate addition chain
1541         multiplied/divided by the operand.
1542
1543       * All candidate chains get disabled for further processing and
1544         processing of (operand, code) pairs continues.
1545
1546   The alternate addition chains built are re-processed by the main
1547   reassociation algorithm which allows optimizing a * x * y + b * y * x
1548   to (a + b ) * x * y in one invocation of the reassociation pass.  */
1549
1550 static bool
1551 undistribute_ops_list (enum tree_code opcode,
1552                        vec<operand_entry *> *ops, struct loop *loop)
1553 {
1554   unsigned int length = ops->length ();
1555   operand_entry *oe1;
1556   unsigned i, j;
1557   unsigned nr_candidates, nr_candidates2;
1558   sbitmap_iterator sbi0;
1559   vec<operand_entry *> *subops;
1560   bool changed = false;
1561   unsigned int next_oecount_id = 0;
1562
1563   if (length <= 1
1564       || opcode != PLUS_EXPR)
1565     return false;
1566
1567   /* Build a list of candidates to process.  */
1568   auto_sbitmap candidates (length);
1569   bitmap_clear (candidates);
1570   nr_candidates = 0;
1571   FOR_EACH_VEC_ELT (*ops, i, oe1)
1572     {
1573       enum tree_code dcode;
1574       gimple *oe1def;
1575
1576       if (TREE_CODE (oe1->op) != SSA_NAME)
1577         continue;
1578       oe1def = SSA_NAME_DEF_STMT (oe1->op);
1579       if (!is_gimple_assign (oe1def))
1580         continue;
1581       dcode = gimple_assign_rhs_code (oe1def);
1582       if ((dcode != MULT_EXPR
1583            && dcode != RDIV_EXPR)
1584           || !is_reassociable_op (oe1def, dcode, loop))
1585         continue;
1586
1587       bitmap_set_bit (candidates, i);
1588       nr_candidates++;
1589     }
1590
1591   if (nr_candidates < 2)
1592     return false;
1593
1594   if (dump_file && (dump_flags & TDF_DETAILS))
1595     {
1596       fprintf (dump_file, "searching for un-distribute opportunities ");
1597       print_generic_expr (dump_file,
1598         (*ops)[bitmap_first_set_bit (candidates)]->op, 0);
1599       fprintf (dump_file, " %d\n", nr_candidates);
1600     }
1601
1602   /* Build linearized sub-operand lists and the counting table.  */
1603   cvec.create (0);
1604
1605   hash_table<oecount_hasher> ctable (15);
1606
1607   /* ??? Macro arguments cannot have multi-argument template types in
1608      them.  This typedef is needed to workaround that limitation.  */
1609   typedef vec<operand_entry *> vec_operand_entry_t_heap;
1610   subops = XCNEWVEC (vec_operand_entry_t_heap, ops->length ());
1611   EXECUTE_IF_SET_IN_BITMAP (candidates, 0, i, sbi0)
1612     {
1613       gimple *oedef;
1614       enum tree_code oecode;
1615       unsigned j;
1616
1617       oedef = SSA_NAME_DEF_STMT ((*ops)[i]->op);
1618       oecode = gimple_assign_rhs_code (oedef);
1619       linearize_expr_tree (&subops[i], oedef,
1620                            associative_tree_code (oecode), false);
1621
1622       FOR_EACH_VEC_ELT (subops[i], j, oe1)
1623         {
1624           oecount c;
1625           int *slot;
1626           int idx;
1627           c.oecode = oecode;
1628           c.cnt = 1;
1629           c.id = next_oecount_id++;
1630           c.op = oe1->op;
1631           cvec.safe_push (c);
1632           idx = cvec.length () + 41;
1633           slot = ctable.find_slot (idx, INSERT);
1634           if (!*slot)
1635             {
1636               *slot = idx;
1637             }
1638           else
1639             {
1640               cvec.pop ();
1641               cvec[*slot - 42].cnt++;
1642             }
1643         }
1644     }
1645
1646   /* Sort the counting table.  */
1647   cvec.qsort (oecount_cmp);
1648
1649   if (dump_file && (dump_flags & TDF_DETAILS))
1650     {
1651       oecount *c;
1652       fprintf (dump_file, "Candidates:\n");
1653       FOR_EACH_VEC_ELT (cvec, j, c)
1654         {
1655           fprintf (dump_file, "  %u %s: ", c->cnt,
1656                    c->oecode == MULT_EXPR
1657                    ? "*" : c->oecode == RDIV_EXPR ? "/" : "?");
1658           print_generic_expr (dump_file, c->op);
1659           fprintf (dump_file, "\n");
1660         }
1661     }
1662
1663   /* Process the (operand, code) pairs in order of most occurrence.  */
1664   auto_sbitmap candidates2 (length);
1665   while (!cvec.is_empty ())
1666     {
1667       oecount *c = &cvec.last ();
1668       if (c->cnt < 2)
1669         break;
1670
1671       /* Now collect the operands in the outer chain that contain
1672          the common operand in their inner chain.  */
1673       bitmap_clear (candidates2);
1674       nr_candidates2 = 0;
1675       EXECUTE_IF_SET_IN_BITMAP (candidates, 0, i, sbi0)
1676         {
1677           gimple *oedef;
1678           enum tree_code oecode;
1679           unsigned j;
1680           tree op = (*ops)[i]->op;
1681
1682           /* If we undistributed in this chain already this may be
1683              a constant.  */
1684           if (TREE_CODE (op) != SSA_NAME)
1685             continue;
1686
1687           oedef = SSA_NAME_DEF_STMT (op);
1688           oecode = gimple_assign_rhs_code (oedef);
1689           if (oecode != c->oecode)
1690             continue;
1691
1692           FOR_EACH_VEC_ELT (subops[i], j, oe1)
1693             {
1694               if (oe1->op == c->op)
1695                 {
1696                   bitmap_set_bit (candidates2, i);
1697                   ++nr_candidates2;
1698                   break;
1699                 }
1700             }
1701         }
1702
1703       if (nr_candidates2 >= 2)
1704         {
1705           operand_entry *oe1, *oe2;
1706           gimple *prod;
1707           int first = bitmap_first_set_bit (candidates2);
1708
1709           /* Build the new addition chain.  */
1710           oe1 = (*ops)[first];
1711           if (dump_file && (dump_flags & TDF_DETAILS))
1712             {
1713               fprintf (dump_file, "Building (");
1714               print_generic_expr (dump_file, oe1->op);
1715             }
1716           zero_one_operation (&oe1->op, c->oecode, c->op);
1717           EXECUTE_IF_SET_IN_BITMAP (candidates2, first+1, i, sbi0)
1718             {
1719               gimple *sum;
1720               oe2 = (*ops)[i];
1721               if (dump_file && (dump_flags & TDF_DETAILS))
1722                 {
1723                   fprintf (dump_file, " + ");
1724                   print_generic_expr (dump_file, oe2->op);
1725                 }
1726               zero_one_operation (&oe2->op, c->oecode, c->op);
1727               sum = build_and_add_sum (TREE_TYPE (oe1->op),
1728                                        oe1->op, oe2->op, opcode);
1729               oe2->op = build_zero_cst (TREE_TYPE (oe2->op));
1730               oe2->rank = 0;
1731               oe1->op = gimple_get_lhs (sum);
1732             }
1733
1734           /* Apply the multiplication/division.  */
1735           prod = build_and_add_sum (TREE_TYPE (oe1->op),
1736                                     oe1->op, c->op, c->oecode);
1737           if (dump_file && (dump_flags & TDF_DETAILS))
1738             {
1739               fprintf (dump_file, ") %s ", c->oecode == MULT_EXPR ? "*" : "/");
1740               print_generic_expr (dump_file, c->op);
1741               fprintf (dump_file, "\n");
1742             }
1743
1744           /* Record it in the addition chain and disable further
1745              undistribution with this op.  */
1746           oe1->op = gimple_assign_lhs (prod);
1747           oe1->rank = get_rank (oe1->op);
1748           subops[first].release ();
1749
1750           changed = true;
1751         }
1752
1753       cvec.pop ();
1754     }
1755
1756   for (i = 0; i < ops->length (); ++i)
1757     subops[i].release ();
1758   free (subops);
1759   cvec.release ();
1760
1761   return changed;
1762 }
1763
1764 /* If OPCODE is BIT_IOR_EXPR or BIT_AND_EXPR and CURR is a comparison
1765    expression, examine the other OPS to see if any of them are comparisons
1766    of the same values, which we may be able to combine or eliminate.
1767    For example, we can rewrite (a < b) | (a == b) as (a <= b).  */
1768
1769 static bool
1770 eliminate_redundant_comparison (enum tree_code opcode,
1771                                 vec<operand_entry *> *ops,
1772                                 unsigned int currindex,
1773                                 operand_entry *curr)
1774 {
1775   tree op1, op2;
1776   enum tree_code lcode, rcode;
1777   gimple *def1, *def2;
1778   int i;
1779   operand_entry *oe;
1780
1781   if (opcode != BIT_IOR_EXPR && opcode != BIT_AND_EXPR)
1782     return false;
1783
1784   /* Check that CURR is a comparison.  */
1785   if (TREE_CODE (curr->op) != SSA_NAME)
1786     return false;
1787   def1 = SSA_NAME_DEF_STMT (curr->op);
1788   if (!is_gimple_assign (def1))
1789     return false;
1790   lcode = gimple_assign_rhs_code (def1);
1791   if (TREE_CODE_CLASS (lcode) != tcc_comparison)
1792     return false;
1793   op1 = gimple_assign_rhs1 (def1);
1794   op2 = gimple_assign_rhs2 (def1);
1795
1796   /* Now look for a similar comparison in the remaining OPS.  */
1797   for (i = currindex + 1; ops->iterate (i, &oe); i++)
1798     {
1799       tree t;
1800
1801       if (TREE_CODE (oe->op) != SSA_NAME)
1802         continue;
1803       def2 = SSA_NAME_DEF_STMT (oe->op);
1804       if (!is_gimple_assign (def2))
1805         continue;
1806       rcode = gimple_assign_rhs_code (def2);
1807       if (TREE_CODE_CLASS (rcode) != tcc_comparison)
1808         continue;
1809
1810       /* If we got here, we have a match.  See if we can combine the
1811          two comparisons.  */
1812       if (opcode == BIT_IOR_EXPR)
1813         t = maybe_fold_or_comparisons (lcode, op1, op2,
1814                                        rcode, gimple_assign_rhs1 (def2),
1815                                        gimple_assign_rhs2 (def2));
1816       else
1817         t = maybe_fold_and_comparisons (lcode, op1, op2,
1818                                         rcode, gimple_assign_rhs1 (def2),
1819                                         gimple_assign_rhs2 (def2));
1820       if (!t)
1821         continue;
1822
1823       /* maybe_fold_and_comparisons and maybe_fold_or_comparisons
1824          always give us a boolean_type_node value back.  If the original
1825          BIT_AND_EXPR or BIT_IOR_EXPR was of a wider integer type,
1826          we need to convert.  */
1827       if (!useless_type_conversion_p (TREE_TYPE (curr->op), TREE_TYPE (t)))
1828         t = fold_convert (TREE_TYPE (curr->op), t);
1829
1830       if (TREE_CODE (t) != INTEGER_CST
1831           && !operand_equal_p (t, curr->op, 0))
1832         {
1833           enum tree_code subcode;
1834           tree newop1, newop2;
1835           if (!COMPARISON_CLASS_P (t))
1836             continue;
1837           extract_ops_from_tree (t, &subcode, &newop1, &newop2);
1838           STRIP_USELESS_TYPE_CONVERSION (newop1);
1839           STRIP_USELESS_TYPE_CONVERSION (newop2);
1840           if (!is_gimple_val (newop1) || !is_gimple_val (newop2))
1841             continue;
1842         }
1843
1844       if (dump_file && (dump_flags & TDF_DETAILS))
1845         {
1846           fprintf (dump_file, "Equivalence: ");
1847           print_generic_expr (dump_file, curr->op);
1848           fprintf (dump_file, " %s ", op_symbol_code (opcode));
1849           print_generic_expr (dump_file, oe->op);
1850           fprintf (dump_file, " -> ");
1851           print_generic_expr (dump_file, t);
1852           fprintf (dump_file, "\n");
1853         }
1854
1855       /* Now we can delete oe, as it has been subsumed by the new combined
1856          expression t.  */
1857       ops->ordered_remove (i);
1858       reassociate_stats.ops_eliminated ++;
1859
1860       /* If t is the same as curr->op, we're done.  Otherwise we must
1861          replace curr->op with t.  Special case is if we got a constant
1862          back, in which case we add it to the end instead of in place of
1863          the current entry.  */
1864       if (TREE_CODE (t) == INTEGER_CST)
1865         {
1866           ops->ordered_remove (currindex);
1867           add_to_ops_vec (ops, t);
1868         }
1869       else if (!operand_equal_p (t, curr->op, 0))
1870         {
1871           gimple *sum;
1872           enum tree_code subcode;
1873           tree newop1;
1874           tree newop2;
1875           gcc_assert (COMPARISON_CLASS_P (t));
1876           extract_ops_from_tree (t, &subcode, &newop1, &newop2);
1877           STRIP_USELESS_TYPE_CONVERSION (newop1);
1878           STRIP_USELESS_TYPE_CONVERSION (newop2);
1879           gcc_checking_assert (is_gimple_val (newop1)
1880                                && is_gimple_val (newop2));
1881           sum = build_and_add_sum (TREE_TYPE (t), newop1, newop2, subcode);
1882           curr->op = gimple_get_lhs (sum);
1883         }
1884       return true;
1885     }
1886
1887   return false;
1888 }
1889
1890
1891 /* Transform repeated addition of same values into multiply with
1892    constant.  */
1893 static bool
1894 transform_add_to_multiply (vec<operand_entry *> *ops)
1895 {
1896   operand_entry *oe;
1897   tree op = NULL_TREE;
1898   int j;
1899   int i, start = -1, end = 0, count = 0;
1900   auto_vec<std::pair <int, int> > indxs;
1901   bool changed = false;
1902
1903   if (!INTEGRAL_TYPE_P (TREE_TYPE ((*ops)[0]->op))
1904       && (!SCALAR_FLOAT_TYPE_P (TREE_TYPE ((*ops)[0]->op))
1905           || !flag_unsafe_math_optimizations))
1906     return false;
1907
1908   /* Look for repeated operands.  */
1909   FOR_EACH_VEC_ELT (*ops, i, oe)
1910     {
1911       if (start == -1)
1912         {
1913           count = 1;
1914           op = oe->op;
1915           start = i;
1916         }
1917       else if (operand_equal_p (oe->op, op, 0))
1918         {
1919           count++;
1920           end = i;
1921         }
1922       else
1923         {
1924           if (count > 1)
1925             indxs.safe_push (std::make_pair (start, end));
1926           count = 1;
1927           op = oe->op;
1928           start = i;
1929         }
1930     }
1931
1932   if (count > 1)
1933     indxs.safe_push (std::make_pair (start, end));
1934
1935   for (j = indxs.length () - 1; j >= 0; --j)
1936     {
1937       /* Convert repeated operand addition to multiplication.  */
1938       start = indxs[j].first;
1939       end = indxs[j].second;
1940       op = (*ops)[start]->op;
1941       count = end - start + 1;
1942       for (i = end; i >= start; --i)
1943         ops->unordered_remove (i);
1944       tree tmp = make_ssa_name (TREE_TYPE (op));
1945       tree cst = build_int_cst (integer_type_node, count);
1946       gassign *mul_stmt
1947         = gimple_build_assign (tmp, MULT_EXPR,
1948                                op, fold_convert (TREE_TYPE (op), cst));
1949       gimple_set_visited (mul_stmt, true);
1950       add_to_ops_vec (ops, tmp, mul_stmt);
1951       changed = true;
1952     }
1953
1954   return changed;
1955 }
1956
1957
1958 /* Perform various identities and other optimizations on the list of
1959    operand entries, stored in OPS.  The tree code for the binary
1960    operation between all the operands is OPCODE.  */
1961
1962 static void
1963 optimize_ops_list (enum tree_code opcode,
1964                    vec<operand_entry *> *ops)
1965 {
1966   unsigned int length = ops->length ();
1967   unsigned int i;
1968   operand_entry *oe;
1969   operand_entry *oelast = NULL;
1970   bool iterate = false;
1971
1972   if (length == 1)
1973     return;
1974
1975   oelast = ops->last ();
1976
1977   /* If the last two are constants, pop the constants off, merge them
1978      and try the next two.  */
1979   if (oelast->rank == 0 && is_gimple_min_invariant (oelast->op))
1980     {
1981       operand_entry *oelm1 = (*ops)[length - 2];
1982
1983       if (oelm1->rank == 0
1984           && is_gimple_min_invariant (oelm1->op)
1985           && useless_type_conversion_p (TREE_TYPE (oelm1->op),
1986                                        TREE_TYPE (oelast->op)))
1987         {
1988           tree folded = fold_binary (opcode, TREE_TYPE (oelm1->op),
1989                                      oelm1->op, oelast->op);
1990
1991           if (folded && is_gimple_min_invariant (folded))
1992             {
1993               if (dump_file && (dump_flags & TDF_DETAILS))
1994                 fprintf (dump_file, "Merging constants\n");
1995
1996               ops->pop ();
1997               ops->pop ();
1998
1999               add_to_ops_vec (ops, folded);
2000               reassociate_stats.constants_eliminated++;
2001
2002               optimize_ops_list (opcode, ops);
2003               return;
2004             }
2005         }
2006     }
2007
2008   eliminate_using_constants (opcode, ops);
2009   oelast = NULL;
2010
2011   for (i = 0; ops->iterate (i, &oe);)
2012     {
2013       bool done = false;
2014
2015       if (eliminate_not_pairs (opcode, ops, i, oe))
2016         return;
2017       if (eliminate_duplicate_pair (opcode, ops, &done, i, oe, oelast)
2018           || (!done && eliminate_plus_minus_pair (opcode, ops, i, oe))
2019           || (!done && eliminate_redundant_comparison (opcode, ops, i, oe)))
2020         {
2021           if (done)
2022             return;
2023           iterate = true;
2024           oelast = NULL;
2025           continue;
2026         }
2027       oelast = oe;
2028       i++;
2029     }
2030
2031   length = ops->length ();
2032   oelast = ops->last ();
2033
2034   if (iterate)
2035     optimize_ops_list (opcode, ops);
2036 }
2037
2038 /* The following functions are subroutines to optimize_range_tests and allow
2039    it to try to change a logical combination of comparisons into a range
2040    test.
2041
2042    For example, both
2043         X == 2 || X == 5 || X == 3 || X == 4
2044    and
2045         X >= 2 && X <= 5
2046    are converted to
2047         (unsigned) (X - 2) <= 3
2048
2049    For more information see comments above fold_test_range in fold-const.c,
2050    this implementation is for GIMPLE.  */
2051
2052 struct range_entry
2053 {
2054   tree exp;
2055   tree low;
2056   tree high;
2057   bool in_p;
2058   bool strict_overflow_p;
2059   unsigned int idx, next;
2060 };
2061
2062 /* This is similar to make_range in fold-const.c, but on top of
2063    GIMPLE instead of trees.  If EXP is non-NULL, it should be
2064    an SSA_NAME and STMT argument is ignored, otherwise STMT
2065    argument should be a GIMPLE_COND.  */
2066
2067 static void
2068 init_range_entry (struct range_entry *r, tree exp, gimple *stmt)
2069 {
2070   int in_p;
2071   tree low, high;
2072   bool is_bool, strict_overflow_p;
2073
2074   r->exp = NULL_TREE;
2075   r->in_p = false;
2076   r->strict_overflow_p = false;
2077   r->low = NULL_TREE;
2078   r->high = NULL_TREE;
2079   if (exp != NULL_TREE
2080       && (TREE_CODE (exp) != SSA_NAME || !INTEGRAL_TYPE_P (TREE_TYPE (exp))))
2081     return;
2082
2083   /* Start with simply saying "EXP != 0" and then look at the code of EXP
2084      and see if we can refine the range.  Some of the cases below may not
2085      happen, but it doesn't seem worth worrying about this.  We "continue"
2086      the outer loop when we've changed something; otherwise we "break"
2087      the switch, which will "break" the while.  */
2088   low = exp ? build_int_cst (TREE_TYPE (exp), 0) : boolean_false_node;
2089   high = low;
2090   in_p = 0;
2091   strict_overflow_p = false;
2092   is_bool = false;
2093   if (exp == NULL_TREE)
2094     is_bool = true;
2095   else if (TYPE_PRECISION (TREE_TYPE (exp)) == 1)
2096     {
2097       if (TYPE_UNSIGNED (TREE_TYPE (exp)))
2098         is_bool = true;
2099       else
2100         return;
2101     }
2102   else if (TREE_CODE (TREE_TYPE (exp)) == BOOLEAN_TYPE)
2103     is_bool = true;
2104
2105   while (1)
2106     {
2107       enum tree_code code;
2108       tree arg0, arg1, exp_type;
2109       tree nexp;
2110       location_t loc;
2111
2112       if (exp != NULL_TREE)
2113         {
2114           if (TREE_CODE (exp) != SSA_NAME
2115               || SSA_NAME_OCCURS_IN_ABNORMAL_PHI (exp))
2116             break;
2117
2118           stmt = SSA_NAME_DEF_STMT (exp);
2119           if (!is_gimple_assign (stmt))
2120             break;
2121
2122           code = gimple_assign_rhs_code (stmt);
2123           arg0 = gimple_assign_rhs1 (stmt);
2124           arg1 = gimple_assign_rhs2 (stmt);
2125           exp_type = TREE_TYPE (exp);
2126         }
2127       else
2128         {
2129           code = gimple_cond_code (stmt);
2130           arg0 = gimple_cond_lhs (stmt);
2131           arg1 = gimple_cond_rhs (stmt);
2132           exp_type = boolean_type_node;
2133         }
2134
2135       if (TREE_CODE (arg0) != SSA_NAME)
2136         break;
2137       loc = gimple_location (stmt);
2138       switch (code)
2139         {
2140         case BIT_NOT_EXPR:
2141           if (TREE_CODE (TREE_TYPE (exp)) == BOOLEAN_TYPE
2142               /* Ensure the range is either +[-,0], +[0,0],
2143                  -[-,0], -[0,0] or +[1,-], +[1,1], -[1,-] or
2144                  -[1,1].  If it is e.g. +[-,-] or -[-,-]
2145                  or similar expression of unconditional true or
2146                  false, it should not be negated.  */
2147               && ((high && integer_zerop (high))
2148                   || (low && integer_onep (low))))
2149             {
2150               in_p = !in_p;
2151               exp = arg0;
2152               continue;
2153             }
2154           break;
2155         case SSA_NAME:
2156           exp = arg0;
2157           continue;
2158         CASE_CONVERT:
2159           if (is_bool)
2160             goto do_default;
2161           if (TYPE_PRECISION (TREE_TYPE (arg0)) == 1)
2162             {
2163               if (TYPE_UNSIGNED (TREE_TYPE (arg0)))
2164                 is_bool = true;
2165               else
2166                 return;
2167             }
2168           else if (TREE_CODE (TREE_TYPE (arg0)) == BOOLEAN_TYPE)
2169             is_bool = true;
2170           goto do_default;
2171         case EQ_EXPR:
2172         case NE_EXPR:
2173         case LT_EXPR:
2174         case LE_EXPR:
2175         case GE_EXPR:
2176         case GT_EXPR:
2177           is_bool = true;
2178           /* FALLTHRU */
2179         default:
2180           if (!is_bool)
2181             return;
2182         do_default:
2183           nexp = make_range_step (loc, code, arg0, arg1, exp_type,
2184                                   &low, &high, &in_p,
2185                                   &strict_overflow_p);
2186           if (nexp != NULL_TREE)
2187             {
2188               exp = nexp;
2189               gcc_assert (TREE_CODE (exp) == SSA_NAME);
2190               continue;
2191             }
2192           break;
2193         }
2194       break;
2195     }
2196   if (is_bool)
2197     {
2198       r->exp = exp;
2199       r->in_p = in_p;
2200       r->low = low;
2201       r->high = high;
2202       r->strict_overflow_p = strict_overflow_p;
2203     }
2204 }
2205
2206 /* Comparison function for qsort.  Sort entries
2207    without SSA_NAME exp first, then with SSA_NAMEs sorted
2208    by increasing SSA_NAME_VERSION, and for the same SSA_NAMEs
2209    by increasing ->low and if ->low is the same, by increasing
2210    ->high.  ->low == NULL_TREE means minimum, ->high == NULL_TREE
2211    maximum.  */
2212
2213 static int
2214 range_entry_cmp (const void *a, const void *b)
2215 {
2216   const struct range_entry *p = (const struct range_entry *) a;
2217   const struct range_entry *q = (const struct range_entry *) b;
2218
2219   if (p->exp != NULL_TREE && TREE_CODE (p->exp) == SSA_NAME)
2220     {
2221       if (q->exp != NULL_TREE && TREE_CODE (q->exp) == SSA_NAME)
2222         {
2223           /* Group range_entries for the same SSA_NAME together.  */
2224           if (SSA_NAME_VERSION (p->exp) < SSA_NAME_VERSION (q->exp))
2225             return -1;
2226           else if (SSA_NAME_VERSION (p->exp) > SSA_NAME_VERSION (q->exp))
2227             return 1;
2228           /* If ->low is different, NULL low goes first, then by
2229              ascending low.  */
2230           if (p->low != NULL_TREE)
2231             {
2232               if (q->low != NULL_TREE)
2233                 {
2234                   tree tem = fold_binary (LT_EXPR, boolean_type_node,
2235                                           p->low, q->low);
2236                   if (tem && integer_onep (tem))
2237                     return -1;
2238                   tem = fold_binary (GT_EXPR, boolean_type_node,
2239                                      p->low, q->low);
2240                   if (tem && integer_onep (tem))
2241                     return 1;
2242                 }
2243               else
2244                 return 1;
2245             }
2246           else if (q->low != NULL_TREE)
2247             return -1;
2248           /* If ->high is different, NULL high goes last, before that by
2249              ascending high.  */
2250           if (p->high != NULL_TREE)
2251             {
2252               if (q->high != NULL_TREE)
2253                 {
2254                   tree tem = fold_binary (LT_EXPR, boolean_type_node,
2255                                           p->high, q->high);
2256                   if (tem && integer_onep (tem))
2257                     return -1;
2258                   tem = fold_binary (GT_EXPR, boolean_type_node,
2259                                      p->high, q->high);
2260                   if (tem && integer_onep (tem))
2261                     return 1;
2262                 }
2263               else
2264                 return -1;
2265             }
2266           else if (q->high != NULL_TREE)
2267             return 1;
2268           /* If both ranges are the same, sort below by ascending idx.  */
2269         }
2270       else
2271         return 1;
2272     }
2273   else if (q->exp != NULL_TREE && TREE_CODE (q->exp) == SSA_NAME)
2274     return -1;
2275
2276   if (p->idx < q->idx)
2277     return -1;
2278   else
2279     {
2280       gcc_checking_assert (p->idx > q->idx);
2281       return 1;
2282     }
2283 }
2284
2285 /* Helper function for update_range_test.  Force EXPR into an SSA_NAME,
2286    insert needed statements BEFORE or after GSI.  */
2287
2288 static tree
2289 force_into_ssa_name (gimple_stmt_iterator *gsi, tree expr, bool before)
2290 {
2291   enum gsi_iterator_update m = before ? GSI_SAME_STMT : GSI_CONTINUE_LINKING;
2292   tree ret = force_gimple_operand_gsi (gsi, expr, true, NULL_TREE, before, m);
2293   if (TREE_CODE (ret) != SSA_NAME)
2294     {
2295       gimple *g = gimple_build_assign (make_ssa_name (TREE_TYPE (ret)), ret);
2296       if (before)
2297         gsi_insert_before (gsi, g, GSI_SAME_STMT);
2298       else
2299         gsi_insert_after (gsi, g, GSI_CONTINUE_LINKING);
2300       ret = gimple_assign_lhs (g);
2301     }
2302   return ret;
2303 }
2304
2305 /* Helper routine of optimize_range_test.
2306    [EXP, IN_P, LOW, HIGH, STRICT_OVERFLOW_P] is a merged range for
2307    RANGE and OTHERRANGE through OTHERRANGE + COUNT - 1 ranges,
2308    OPCODE and OPS are arguments of optimize_range_tests.  If OTHERRANGE
2309    is NULL, OTHERRANGEP should not be and then OTHERRANGEP points to
2310    an array of COUNT pointers to other ranges.  Return
2311    true if the range merge has been successful.
2312    If OPCODE is ERROR_MARK, this is called from within
2313    maybe_optimize_range_tests and is performing inter-bb range optimization.
2314    In that case, whether an op is BIT_AND_EXPR or BIT_IOR_EXPR is found in
2315    oe->rank.  */
2316
2317 static bool
2318 update_range_test (struct range_entry *range, struct range_entry *otherrange,
2319                    struct range_entry **otherrangep,
2320                    unsigned int count, enum tree_code opcode,
2321                    vec<operand_entry *> *ops, tree exp, gimple_seq seq,
2322                    bool in_p, tree low, tree high, bool strict_overflow_p)
2323 {
2324   operand_entry *oe = (*ops)[range->idx];
2325   tree op = oe->op;
2326   gimple *stmt = op ? SSA_NAME_DEF_STMT (op)
2327                     : last_stmt (BASIC_BLOCK_FOR_FN (cfun, oe->id));
2328   location_t loc = gimple_location (stmt);
2329   tree optype = op ? TREE_TYPE (op) : boolean_type_node;
2330   tree tem = build_range_check (loc, optype, unshare_expr (exp),
2331                                 in_p, low, high);
2332   enum warn_strict_overflow_code wc = WARN_STRICT_OVERFLOW_COMPARISON;
2333   gimple_stmt_iterator gsi;
2334   unsigned int i, uid;
2335
2336   if (tem == NULL_TREE)
2337     return false;
2338
2339   /* If op is default def SSA_NAME, there is no place to insert the
2340      new comparison.  Give up, unless we can use OP itself as the
2341      range test.  */
2342   if (op && SSA_NAME_IS_DEFAULT_DEF (op))
2343     {
2344       if (op == range->exp
2345           && ((TYPE_PRECISION (optype) == 1 && TYPE_UNSIGNED (optype))
2346               || TREE_CODE (optype) == BOOLEAN_TYPE)
2347           && (op == tem
2348               || (TREE_CODE (tem) == EQ_EXPR
2349                   && TREE_OPERAND (tem, 0) == op
2350                   && integer_onep (TREE_OPERAND (tem, 1))))
2351           && opcode != BIT_IOR_EXPR
2352           && (opcode != ERROR_MARK || oe->rank != BIT_IOR_EXPR))
2353         {
2354           stmt = NULL;
2355           tem = op;
2356         }
2357       else
2358         return false;
2359     }
2360
2361   if (strict_overflow_p && issue_strict_overflow_warning (wc))
2362     warning_at (loc, OPT_Wstrict_overflow,
2363                 "assuming signed overflow does not occur "
2364                 "when simplifying range test");
2365
2366   if (dump_file && (dump_flags & TDF_DETAILS))
2367     {
2368       struct range_entry *r;
2369       fprintf (dump_file, "Optimizing range tests ");
2370       print_generic_expr (dump_file, range->exp);
2371       fprintf (dump_file, " %c[", range->in_p ? '+' : '-');
2372       print_generic_expr (dump_file, range->low);
2373       fprintf (dump_file, ", ");
2374       print_generic_expr (dump_file, range->high);
2375       fprintf (dump_file, "]");
2376       for (i = 0; i < count; i++)
2377         {
2378           if (otherrange)
2379             r = otherrange + i;
2380           else
2381             r = otherrangep[i];
2382           fprintf (dump_file, " and %c[", r->in_p ? '+' : '-');
2383           print_generic_expr (dump_file, r->low);
2384           fprintf (dump_file, ", ");
2385           print_generic_expr (dump_file, r->high);
2386           fprintf (dump_file, "]");
2387         }
2388       fprintf (dump_file, "\n into ");
2389       print_generic_expr (dump_file, tem);
2390       fprintf (dump_file, "\n");
2391     }
2392
2393   if (opcode == BIT_IOR_EXPR
2394       || (opcode == ERROR_MARK && oe->rank == BIT_IOR_EXPR))
2395     tem = invert_truthvalue_loc (loc, tem);
2396
2397   tem = fold_convert_loc (loc, optype, tem);
2398   if (stmt)
2399     {
2400       gsi = gsi_for_stmt (stmt);
2401       uid = gimple_uid (stmt);
2402     }
2403   else
2404     {
2405       gsi = gsi_none ();
2406       uid = 0;
2407     }
2408   if (stmt == NULL)
2409     gcc_checking_assert (tem == op);
2410   /* In rare cases range->exp can be equal to lhs of stmt.
2411      In that case we have to insert after the stmt rather then before
2412      it.  If stmt is a PHI, insert it at the start of the basic block.  */
2413   else if (op != range->exp)
2414     {
2415       gsi_insert_seq_before (&gsi, seq, GSI_SAME_STMT);
2416       tem = force_into_ssa_name (&gsi, tem, true);
2417       gsi_prev (&gsi);
2418     }
2419   else if (gimple_code (stmt) != GIMPLE_PHI)
2420     {
2421       gsi_insert_seq_after (&gsi, seq, GSI_CONTINUE_LINKING);
2422       tem = force_into_ssa_name (&gsi, tem, false);
2423     }
2424   else
2425     {
2426       gsi = gsi_after_labels (gimple_bb (stmt));
2427       if (!gsi_end_p (gsi))
2428         uid = gimple_uid (gsi_stmt (gsi));
2429       else
2430         {
2431           gsi = gsi_start_bb (gimple_bb (stmt));
2432           uid = 1;
2433           while (!gsi_end_p (gsi))
2434             {
2435               uid = gimple_uid (gsi_stmt (gsi));
2436               gsi_next (&gsi);
2437             }
2438         }
2439       gsi_insert_seq_before (&gsi, seq, GSI_SAME_STMT);
2440       tem = force_into_ssa_name (&gsi, tem, true);
2441       if (gsi_end_p (gsi))
2442         gsi = gsi_last_bb (gimple_bb (stmt));
2443       else
2444         gsi_prev (&gsi);
2445     }
2446   for (; !gsi_end_p (gsi); gsi_prev (&gsi))
2447     if (gimple_uid (gsi_stmt (gsi)))
2448       break;
2449     else
2450       gimple_set_uid (gsi_stmt (gsi), uid);
2451
2452   oe->op = tem;
2453   range->exp = exp;
2454   range->low = low;
2455   range->high = high;
2456   range->in_p = in_p;
2457   range->strict_overflow_p = false;
2458
2459   for (i = 0; i < count; i++)
2460     {
2461       if (otherrange)
2462         range = otherrange + i;
2463       else
2464         range = otherrangep[i];
2465       oe = (*ops)[range->idx];
2466       /* Now change all the other range test immediate uses, so that
2467          those tests will be optimized away.  */
2468       if (opcode == ERROR_MARK)
2469         {
2470           if (oe->op)
2471             oe->op = build_int_cst (TREE_TYPE (oe->op),
2472                                     oe->rank == BIT_IOR_EXPR ? 0 : 1);
2473           else
2474             oe->op = (oe->rank == BIT_IOR_EXPR
2475                       ? boolean_false_node : boolean_true_node);
2476         }
2477       else
2478         oe->op = error_mark_node;
2479       range->exp = NULL_TREE;
2480       range->low = NULL_TREE;
2481       range->high = NULL_TREE;
2482     }
2483   return true;
2484 }
2485
2486 /* Optimize X == CST1 || X == CST2
2487    if popcount (CST1 ^ CST2) == 1 into
2488    (X & ~(CST1 ^ CST2)) == (CST1 & ~(CST1 ^ CST2)).
2489    Similarly for ranges.  E.g.
2490    X != 2 && X != 3 && X != 10 && X != 11
2491    will be transformed by the previous optimization into
2492    !((X - 2U) <= 1U || (X - 10U) <= 1U)
2493    and this loop can transform that into
2494    !(((X & ~8) - 2U) <= 1U).  */
2495
2496 static bool
2497 optimize_range_tests_xor (enum tree_code opcode, tree type,
2498                           tree lowi, tree lowj, tree highi, tree highj,
2499                           vec<operand_entry *> *ops,
2500                           struct range_entry *rangei,
2501                           struct range_entry *rangej)
2502 {
2503   tree lowxor, highxor, tem, exp;
2504   /* Check lowi ^ lowj == highi ^ highj and
2505      popcount (lowi ^ lowj) == 1.  */
2506   lowxor = fold_binary (BIT_XOR_EXPR, type, lowi, lowj);
2507   if (lowxor == NULL_TREE || TREE_CODE (lowxor) != INTEGER_CST)
2508     return false;
2509   if (!integer_pow2p (lowxor))
2510     return false;
2511   highxor = fold_binary (BIT_XOR_EXPR, type, highi, highj);
2512   if (!tree_int_cst_equal (lowxor, highxor))
2513     return false;
2514
2515   tem = fold_build1 (BIT_NOT_EXPR, type, lowxor);
2516   exp = fold_build2 (BIT_AND_EXPR, type, rangei->exp, tem);
2517   lowj = fold_build2 (BIT_AND_EXPR, type, lowi, tem);
2518   highj = fold_build2 (BIT_AND_EXPR, type, highi, tem);
2519   if (update_range_test (rangei, rangej, NULL, 1, opcode, ops, exp,
2520                          NULL, rangei->in_p, lowj, highj,
2521                          rangei->strict_overflow_p
2522                          || rangej->strict_overflow_p))
2523     return true;
2524   return false;
2525 }
2526
2527 /* Optimize X == CST1 || X == CST2
2528    if popcount (CST2 - CST1) == 1 into
2529    ((X - CST1) & ~(CST2 - CST1)) == 0.
2530    Similarly for ranges.  E.g.
2531    X == 43 || X == 76 || X == 44 || X == 78 || X == 77 || X == 46
2532    || X == 75 || X == 45
2533    will be transformed by the previous optimization into
2534    (X - 43U) <= 3U || (X - 75U) <= 3U
2535    and this loop can transform that into
2536    ((X - 43U) & ~(75U - 43U)) <= 3U.  */
2537 static bool
2538 optimize_range_tests_diff (enum tree_code opcode, tree type,
2539                            tree lowi, tree lowj, tree highi, tree highj,
2540                            vec<operand_entry *> *ops,
2541                            struct range_entry *rangei,
2542                            struct range_entry *rangej)
2543 {
2544   tree tem1, tem2, mask;
2545   /* Check highi - lowi == highj - lowj.  */
2546   tem1 = fold_binary (MINUS_EXPR, type, highi, lowi);
2547   if (tem1 == NULL_TREE || TREE_CODE (tem1) != INTEGER_CST)
2548     return false;
2549   tem2 = fold_binary (MINUS_EXPR, type, highj, lowj);
2550   if (!tree_int_cst_equal (tem1, tem2))
2551     return false;
2552   /* Check popcount (lowj - lowi) == 1.  */
2553   tem1 = fold_binary (MINUS_EXPR, type, lowj, lowi);
2554   if (tem1 == NULL_TREE || TREE_CODE (tem1) != INTEGER_CST)
2555     return false;
2556   if (!integer_pow2p (tem1))
2557     return false;
2558
2559   type = unsigned_type_for (type);
2560   tem1 = fold_convert (type, tem1);
2561   tem2 = fold_convert (type, tem2);
2562   lowi = fold_convert (type, lowi);
2563   mask = fold_build1 (BIT_NOT_EXPR, type, tem1);
2564   tem1 = fold_build2 (MINUS_EXPR, type,
2565                       fold_convert (type, rangei->exp), lowi);
2566   tem1 = fold_build2 (BIT_AND_EXPR, type, tem1, mask);
2567   lowj = build_int_cst (type, 0);
2568   if (update_range_test (rangei, rangej, NULL, 1, opcode, ops, tem1,
2569                          NULL, rangei->in_p, lowj, tem2,
2570                          rangei->strict_overflow_p
2571                          || rangej->strict_overflow_p))
2572     return true;
2573   return false;
2574 }
2575
2576 /* It does some common checks for function optimize_range_tests_xor and
2577    optimize_range_tests_diff.
2578    If OPTIMIZE_XOR is TRUE, it calls optimize_range_tests_xor.
2579    Else it calls optimize_range_tests_diff.  */
2580
2581 static bool
2582 optimize_range_tests_1 (enum tree_code opcode, int first, int length,
2583                         bool optimize_xor, vec<operand_entry *> *ops,
2584                         struct range_entry *ranges)
2585 {
2586   int i, j;
2587   bool any_changes = false;
2588   for (i = first; i < length; i++)
2589     {
2590       tree lowi, highi, lowj, highj, type, tem;
2591
2592       if (ranges[i].exp == NULL_TREE || ranges[i].in_p)
2593         continue;
2594       type = TREE_TYPE (ranges[i].exp);
2595       if (!INTEGRAL_TYPE_P (type))
2596         continue;
2597       lowi = ranges[i].low;
2598       if (lowi == NULL_TREE)
2599         lowi = TYPE_MIN_VALUE (type);
2600       highi = ranges[i].high;
2601       if (highi == NULL_TREE)
2602         continue;
2603       for (j = i + 1; j < length && j < i + 64; j++)
2604         {
2605           bool changes;
2606           if (ranges[i].exp != ranges[j].exp || ranges[j].in_p)
2607             continue;
2608           lowj = ranges[j].low;
2609           if (lowj == NULL_TREE)
2610             continue;
2611           highj = ranges[j].high;
2612           if (highj == NULL_TREE)
2613             highj = TYPE_MAX_VALUE (type);
2614           /* Check lowj > highi.  */
2615           tem = fold_binary (GT_EXPR, boolean_type_node,
2616                              lowj, highi);
2617           if (tem == NULL_TREE || !integer_onep (tem))
2618             continue;
2619           if (optimize_xor)
2620             changes = optimize_range_tests_xor (opcode, type, lowi, lowj,
2621                                                 highi, highj, ops,
2622                                                 ranges + i, ranges + j);
2623           else
2624             changes = optimize_range_tests_diff (opcode, type, lowi, lowj,
2625                                                  highi, highj, ops,
2626                                                  ranges + i, ranges + j);
2627           if (changes)
2628             {
2629               any_changes = true;
2630               break;
2631             }
2632         }
2633     }
2634   return any_changes;
2635 }
2636
2637 /* Helper function of optimize_range_tests_to_bit_test.  Handle a single
2638    range, EXP, LOW, HIGH, compute bit mask of bits to test and return
2639    EXP on success, NULL otherwise.  */
2640
2641 static tree
2642 extract_bit_test_mask (tree exp, int prec, tree totallow, tree low, tree high,
2643                        wide_int *mask, tree *totallowp)
2644 {
2645   tree tem = int_const_binop (MINUS_EXPR, high, low);
2646   if (tem == NULL_TREE
2647       || TREE_CODE (tem) != INTEGER_CST
2648       || TREE_OVERFLOW (tem)
2649       || tree_int_cst_sgn (tem) == -1
2650       || compare_tree_int (tem, prec) != -1)
2651     return NULL_TREE;
2652
2653   unsigned HOST_WIDE_INT max = tree_to_uhwi (tem) + 1;
2654   *mask = wi::shifted_mask (0, max, false, prec);
2655   if (TREE_CODE (exp) == BIT_AND_EXPR
2656       && TREE_CODE (TREE_OPERAND (exp, 1)) == INTEGER_CST)
2657     {
2658       widest_int msk = wi::to_widest (TREE_OPERAND (exp, 1));
2659       msk = wi::zext (~msk, TYPE_PRECISION (TREE_TYPE (exp)));
2660       if (wi::popcount (msk) == 1
2661           && wi::ltu_p (msk, prec - max))
2662         {
2663           *mask |= wi::shifted_mask (msk.to_uhwi (), max, false, prec);
2664           max += msk.to_uhwi ();
2665           exp = TREE_OPERAND (exp, 0);
2666           if (integer_zerop (low)
2667               && TREE_CODE (exp) == PLUS_EXPR
2668               && TREE_CODE (TREE_OPERAND (exp, 1)) == INTEGER_CST)
2669             {
2670               tree ret = TREE_OPERAND (exp, 0);
2671               STRIP_NOPS (ret);
2672               widest_int bias
2673                 = wi::neg (wi::sext (wi::to_widest (TREE_OPERAND (exp, 1)),
2674                                      TYPE_PRECISION (TREE_TYPE (low))));
2675               tree tbias = wide_int_to_tree (TREE_TYPE (ret), bias);
2676               if (totallowp)
2677                 {
2678                   *totallowp = tbias;
2679                   return ret;
2680                 }
2681               else if (!tree_int_cst_lt (totallow, tbias))
2682                 return NULL_TREE;
2683               bias = wi::to_widest (tbias);
2684               bias -= wi::to_widest (totallow);
2685               if (bias >= 0 && bias < prec - max)
2686                 {
2687                   *mask = wi::lshift (*mask, bias);
2688                   return ret;
2689                 }
2690             }
2691         }
2692     }
2693   if (totallowp)
2694     return exp;
2695   if (!tree_int_cst_lt (totallow, low))
2696     return exp;
2697   tem = int_const_binop (MINUS_EXPR, low, totallow);
2698   if (tem == NULL_TREE
2699       || TREE_CODE (tem) != INTEGER_CST
2700       || TREE_OVERFLOW (tem)
2701       || compare_tree_int (tem, prec - max) == 1)
2702     return NULL_TREE;
2703
2704   *mask = wi::lshift (*mask, wi::to_widest (tem));
2705   return exp;
2706 }
2707
2708 /* Attempt to optimize small range tests using bit test.
2709    E.g.
2710    X != 43 && X != 76 && X != 44 && X != 78 && X != 49
2711    && X != 77 && X != 46 && X != 75 && X != 45 && X != 82
2712    has been by earlier optimizations optimized into:
2713    ((X - 43U) & ~32U) > 3U && X != 49 && X != 82
2714    As all the 43 through 82 range is less than 64 numbers,
2715    for 64-bit word targets optimize that into:
2716    (X - 43U) > 40U && ((1 << (X - 43U)) & 0x8F0000004FULL) == 0  */
2717
2718 static bool
2719 optimize_range_tests_to_bit_test (enum tree_code opcode, int first, int length,
2720                                   vec<operand_entry *> *ops,
2721                                   struct range_entry *ranges)
2722 {
2723   int i, j;
2724   bool any_changes = false;
2725   int prec = GET_MODE_BITSIZE (word_mode);
2726   auto_vec<struct range_entry *, 64> candidates;
2727
2728   for (i = first; i < length - 2; i++)
2729     {
2730       tree lowi, highi, lowj, highj, type;
2731
2732       if (ranges[i].exp == NULL_TREE || ranges[i].in_p)
2733         continue;
2734       type = TREE_TYPE (ranges[i].exp);
2735       if (!INTEGRAL_TYPE_P (type))
2736         continue;
2737       lowi = ranges[i].low;
2738       if (lowi == NULL_TREE)
2739         lowi = TYPE_MIN_VALUE (type);
2740       highi = ranges[i].high;
2741       if (highi == NULL_TREE)
2742         continue;
2743       wide_int mask;
2744       tree exp = extract_bit_test_mask (ranges[i].exp, prec, lowi, lowi,
2745                                         highi, &mask, &lowi);
2746       if (exp == NULL_TREE)
2747         continue;
2748       bool strict_overflow_p = ranges[i].strict_overflow_p;
2749       candidates.truncate (0);
2750       int end = MIN (i + 64, length);
2751       for (j = i + 1; j < end; j++)
2752         {
2753           tree exp2;
2754           if (ranges[j].exp == NULL_TREE || ranges[j].in_p)
2755             continue;
2756           if (ranges[j].exp == exp)
2757             ;
2758           else if (TREE_CODE (ranges[j].exp) == BIT_AND_EXPR)
2759             {
2760               exp2 = TREE_OPERAND (ranges[j].exp, 0);
2761               if (exp2 == exp)
2762                 ;
2763               else if (TREE_CODE (exp2) == PLUS_EXPR)
2764                 {
2765                   exp2 = TREE_OPERAND (exp2, 0);
2766                   STRIP_NOPS (exp2);
2767                   if (exp2 != exp)
2768                     continue;
2769                 }
2770               else
2771                 continue;
2772             }
2773           else
2774             continue;
2775           lowj = ranges[j].low;
2776           if (lowj == NULL_TREE)
2777             continue;
2778           highj = ranges[j].high;
2779           if (highj == NULL_TREE)
2780             highj = TYPE_MAX_VALUE (type);
2781           wide_int mask2;
2782           exp2 = extract_bit_test_mask (ranges[j].exp, prec, lowi, lowj,
2783                                         highj, &mask2, NULL);
2784           if (exp2 != exp)
2785             continue;
2786           mask |= mask2;
2787           strict_overflow_p |= ranges[j].strict_overflow_p;
2788           candidates.safe_push (&ranges[j]);
2789         }
2790
2791       /* If we need otherwise 3 or more comparisons, use a bit test.  */
2792       if (candidates.length () >= 2)
2793         {
2794           tree high = wide_int_to_tree (TREE_TYPE (lowi),
2795                                         wi::to_widest (lowi)
2796                                         + prec - 1 - wi::clz (mask));
2797           operand_entry *oe = (*ops)[ranges[i].idx];
2798           tree op = oe->op;
2799           gimple *stmt = op ? SSA_NAME_DEF_STMT (op)
2800                             : last_stmt (BASIC_BLOCK_FOR_FN (cfun, oe->id));
2801           location_t loc = gimple_location (stmt);
2802           tree optype = op ? TREE_TYPE (op) : boolean_type_node;
2803
2804           /* See if it isn't cheaper to pretend the minimum value of the
2805              range is 0, if maximum value is small enough.
2806              We can avoid then subtraction of the minimum value, but the
2807              mask constant could be perhaps more expensive.  */
2808           if (compare_tree_int (lowi, 0) > 0
2809               && compare_tree_int (high, prec) < 0)
2810             {
2811               int cost_diff;
2812               HOST_WIDE_INT m = tree_to_uhwi (lowi);
2813               rtx reg = gen_raw_REG (word_mode, 10000);
2814               bool speed_p = optimize_bb_for_speed_p (gimple_bb (stmt));
2815               cost_diff = set_rtx_cost (gen_rtx_PLUS (word_mode, reg,
2816                                                       GEN_INT (-m)), speed_p);
2817               rtx r = immed_wide_int_const (mask, word_mode);
2818               cost_diff += set_src_cost (gen_rtx_AND (word_mode, reg, r),
2819                                          word_mode, speed_p);
2820               r = immed_wide_int_const (wi::lshift (mask, m), word_mode);
2821               cost_diff -= set_src_cost (gen_rtx_AND (word_mode, reg, r),
2822                                          word_mode, speed_p);
2823               if (cost_diff > 0)
2824                 {
2825                   mask = wi::lshift (mask, m);
2826                   lowi = build_zero_cst (TREE_TYPE (lowi));
2827                 }
2828             }
2829
2830           tree tem = build_range_check (loc, optype, unshare_expr (exp),
2831                                         false, lowi, high);
2832           if (tem == NULL_TREE || is_gimple_val (tem))
2833             continue;
2834           tree etype = unsigned_type_for (TREE_TYPE (exp));
2835           exp = fold_build2_loc (loc, MINUS_EXPR, etype,
2836                                  fold_convert_loc (loc, etype, exp),
2837                                  fold_convert_loc (loc, etype, lowi));
2838           exp = fold_convert_loc (loc, integer_type_node, exp);
2839           tree word_type = lang_hooks.types.type_for_mode (word_mode, 1);
2840           exp = fold_build2_loc (loc, LSHIFT_EXPR, word_type,
2841                                  build_int_cst (word_type, 1), exp);
2842           exp = fold_build2_loc (loc, BIT_AND_EXPR, word_type, exp,
2843                                  wide_int_to_tree (word_type, mask));
2844           exp = fold_build2_loc (loc, EQ_EXPR, optype, exp,
2845                                  build_zero_cst (word_type));
2846           if (is_gimple_val (exp))
2847             continue;
2848
2849           /* The shift might have undefined behavior if TEM is true,
2850              but reassociate_bb isn't prepared to have basic blocks
2851              split when it is running.  So, temporarily emit a code
2852              with BIT_IOR_EXPR instead of &&, and fix it up in
2853              branch_fixup.  */
2854           gimple_seq seq;
2855           tem = force_gimple_operand (tem, &seq, true, NULL_TREE);
2856           gcc_assert (TREE_CODE (tem) == SSA_NAME);
2857           gimple_set_visited (SSA_NAME_DEF_STMT (tem), true);
2858           gimple_seq seq2;
2859           exp = force_gimple_operand (exp, &seq2, true, NULL_TREE);
2860           gimple_seq_add_seq_without_update (&seq, seq2);
2861           gcc_assert (TREE_CODE (exp) == SSA_NAME);
2862           gimple_set_visited (SSA_NAME_DEF_STMT (exp), true);
2863           gimple *g = gimple_build_assign (make_ssa_name (optype),
2864                                            BIT_IOR_EXPR, tem, exp);
2865           gimple_set_location (g, loc);
2866           gimple_seq_add_stmt_without_update (&seq, g);
2867           exp = gimple_assign_lhs (g);
2868           tree val = build_zero_cst (optype);
2869           if (update_range_test (&ranges[i], NULL, candidates.address (),
2870                                  candidates.length (), opcode, ops, exp,
2871                                  seq, false, val, val, strict_overflow_p))
2872             {
2873               any_changes = true;
2874               reassoc_branch_fixups.safe_push (tem);
2875             }
2876           else
2877             gimple_seq_discard (seq);
2878         }
2879     }
2880   return any_changes;
2881 }
2882
2883 /* Attempt to optimize for signed a and b where b is known to be >= 0:
2884    a >= 0 && a < b into (unsigned) a < (unsigned) b
2885    a >= 0 && a <= b into (unsigned) a <= (unsigned) b  */
2886
2887 static bool
2888 optimize_range_tests_var_bound (enum tree_code opcode, int first, int length,
2889                                 vec<operand_entry *> *ops,
2890                                 struct range_entry *ranges)
2891 {
2892   int i;
2893   bool any_changes = false;
2894   hash_map<tree, int> *map = NULL;
2895
2896   for (i = first; i < length; i++)
2897     {
2898       if (ranges[i].exp == NULL_TREE
2899           || TREE_CODE (ranges[i].exp) != SSA_NAME
2900           || !ranges[i].in_p)
2901         continue;
2902
2903       tree type = TREE_TYPE (ranges[i].exp);
2904       if (!INTEGRAL_TYPE_P (type)
2905           || TYPE_UNSIGNED (type)
2906           || ranges[i].low == NULL_TREE
2907           || !integer_zerop (ranges[i].low)
2908           || ranges[i].high != NULL_TREE)
2909         continue;
2910       /* EXP >= 0 here.  */
2911       if (map == NULL)
2912         map = new hash_map <tree, int>;
2913       map->put (ranges[i].exp, i);
2914     }
2915
2916   if (map == NULL)
2917     return false;
2918
2919   for (i = 0; i < length; i++)
2920     {
2921       if (ranges[i].low == NULL_TREE
2922           || ranges[i].high == NULL_TREE
2923           || !integer_zerop (ranges[i].low)
2924           || !integer_zerop (ranges[i].high))
2925         continue;
2926
2927       gimple *stmt;
2928       tree_code ccode;
2929       tree rhs1, rhs2;
2930       if (ranges[i].exp)
2931         {
2932           if (TREE_CODE (ranges[i].exp) != SSA_NAME)
2933             continue;
2934           stmt = SSA_NAME_DEF_STMT (ranges[i].exp);
2935           if (!is_gimple_assign (stmt))
2936             continue;
2937           ccode = gimple_assign_rhs_code (stmt);
2938           rhs1 = gimple_assign_rhs1 (stmt);
2939           rhs2 = gimple_assign_rhs2 (stmt);
2940         }
2941       else
2942         {
2943           operand_entry *oe = (*ops)[ranges[i].idx];
2944           stmt = last_stmt (BASIC_BLOCK_FOR_FN (cfun, oe->id));
2945           if (gimple_code (stmt) != GIMPLE_COND)
2946             continue;
2947           ccode = gimple_cond_code (stmt);
2948           rhs1 = gimple_cond_lhs (stmt);
2949           rhs2 = gimple_cond_rhs (stmt);
2950         }
2951
2952       if (TREE_CODE (rhs1) != SSA_NAME
2953           || rhs2 == NULL_TREE
2954           || TREE_CODE (rhs2) != SSA_NAME)
2955         continue;
2956
2957       switch (ccode)
2958         {
2959         case GT_EXPR:
2960         case GE_EXPR:
2961         case LT_EXPR:
2962         case LE_EXPR:
2963           break;
2964         default:
2965           continue;
2966         }
2967       if (ranges[i].in_p)
2968         ccode = invert_tree_comparison (ccode, false);
2969       switch (ccode)
2970         {
2971         case GT_EXPR:
2972         case GE_EXPR:
2973           std::swap (rhs1, rhs2);
2974           ccode = swap_tree_comparison (ccode);
2975           break;
2976         case LT_EXPR:
2977         case LE_EXPR:
2978           break;
2979         default:
2980           gcc_unreachable ();
2981         }
2982
2983       int *idx = map->get (rhs1);
2984       if (idx == NULL)
2985         continue;
2986
2987       wide_int nz = get_nonzero_bits (rhs2);
2988       if (wi::neg_p (nz))
2989         continue;
2990
2991       /* We have EXP < RHS2 or EXP <= RHS2 where EXP >= 0
2992          and RHS2 is known to be RHS2 >= 0.  */
2993       tree utype = unsigned_type_for (TREE_TYPE (rhs1));
2994
2995       enum warn_strict_overflow_code wc = WARN_STRICT_OVERFLOW_COMPARISON;
2996       if ((ranges[*idx].strict_overflow_p
2997            || ranges[i].strict_overflow_p)
2998           && issue_strict_overflow_warning (wc))
2999         warning_at (gimple_location (stmt), OPT_Wstrict_overflow,
3000                     "assuming signed overflow does not occur "
3001                     "when simplifying range test");
3002
3003       if (dump_file && (dump_flags & TDF_DETAILS))
3004         {
3005           struct range_entry *r = &ranges[*idx];
3006           fprintf (dump_file, "Optimizing range test ");
3007           print_generic_expr (dump_file, r->exp);
3008           fprintf (dump_file, " +[");
3009           print_generic_expr (dump_file, r->low);
3010           fprintf (dump_file, ", ");
3011           print_generic_expr (dump_file, r->high);
3012           fprintf (dump_file, "] and comparison ");
3013           print_generic_expr (dump_file, rhs1);
3014           fprintf (dump_file, " %s ", op_symbol_code (ccode));
3015           print_generic_expr (dump_file, rhs2);
3016           fprintf (dump_file, "\n into (");
3017           print_generic_expr (dump_file, utype);
3018           fprintf (dump_file, ") ");
3019           print_generic_expr (dump_file, rhs1);
3020           fprintf (dump_file, " %s (", op_symbol_code (ccode));
3021           print_generic_expr (dump_file, utype);
3022           fprintf (dump_file, ") ");
3023           print_generic_expr (dump_file, rhs2);
3024           fprintf (dump_file, "\n");
3025         }
3026
3027       operand_entry *oe = (*ops)[ranges[i].idx];
3028       ranges[i].in_p = 0;
3029       if (opcode == BIT_IOR_EXPR
3030           || (opcode == ERROR_MARK && oe->rank == BIT_IOR_EXPR))
3031         {
3032           ranges[i].in_p = 1;
3033           ccode = invert_tree_comparison (ccode, false);
3034         }
3035
3036       unsigned int uid = gimple_uid (stmt);
3037       gimple_stmt_iterator gsi = gsi_for_stmt (stmt);
3038       gimple *g = gimple_build_assign (make_ssa_name (utype), NOP_EXPR, rhs1);
3039       gimple_set_uid (g, uid);
3040       rhs1 = gimple_assign_lhs (g);
3041       gsi_insert_before (&gsi, g, GSI_SAME_STMT);
3042       g = gimple_build_assign (make_ssa_name (utype), NOP_EXPR, rhs2);
3043       gimple_set_uid (g, uid);
3044       rhs2 = gimple_assign_lhs (g);
3045       gsi_insert_before (&gsi, g, GSI_SAME_STMT);
3046       if (tree_swap_operands_p (rhs1, rhs2))
3047         {
3048           std::swap (rhs1, rhs2);
3049           ccode = swap_tree_comparison (ccode);
3050         }
3051       if (gimple_code (stmt) == GIMPLE_COND)
3052         {
3053           gcond *c = as_a <gcond *> (stmt);
3054           gimple_cond_set_code (c, ccode);
3055           gimple_cond_set_lhs (c, rhs1);
3056           gimple_cond_set_rhs (c, rhs2);
3057           update_stmt (stmt);
3058         }
3059       else
3060         {
3061           tree ctype = oe->op ? TREE_TYPE (oe->op) : boolean_type_node;
3062           if (!INTEGRAL_TYPE_P (ctype)
3063               || (TREE_CODE (ctype) != BOOLEAN_TYPE
3064                   && TYPE_PRECISION (ctype) != 1))
3065             ctype = boolean_type_node;
3066           g = gimple_build_assign (make_ssa_name (ctype), ccode, rhs1, rhs2);
3067           gimple_set_uid (g, uid);
3068           gsi_insert_before (&gsi, g, GSI_SAME_STMT);
3069           if (oe->op && ctype != TREE_TYPE (oe->op))
3070             {
3071               g = gimple_build_assign (make_ssa_name (TREE_TYPE (oe->op)),
3072                                        NOP_EXPR, gimple_assign_lhs (g));
3073               gimple_set_uid (g, uid);
3074               gsi_insert_before (&gsi, g, GSI_SAME_STMT);
3075             }
3076           ranges[i].exp = gimple_assign_lhs (g);
3077           oe->op = ranges[i].exp;
3078           ranges[i].low = build_zero_cst (TREE_TYPE (ranges[i].exp));
3079           ranges[i].high = ranges[i].low;
3080         }
3081       ranges[i].strict_overflow_p = false;
3082       oe = (*ops)[ranges[*idx].idx];
3083       /* Now change all the other range test immediate uses, so that
3084          those tests will be optimized away.  */
3085       if (opcode == ERROR_MARK)
3086         {
3087           if (oe->op)
3088             oe->op = build_int_cst (TREE_TYPE (oe->op),
3089                                     oe->rank == BIT_IOR_EXPR ? 0 : 1);
3090           else
3091             oe->op = (oe->rank == BIT_IOR_EXPR
3092                       ? boolean_false_node : boolean_true_node);
3093         }
3094       else
3095         oe->op = error_mark_node;
3096       ranges[*idx].exp = NULL_TREE;
3097       ranges[*idx].low = NULL_TREE;
3098       ranges[*idx].high = NULL_TREE;
3099       any_changes = true;
3100     }
3101
3102   delete map;
3103   return any_changes;
3104 }
3105
3106 /* Optimize range tests, similarly how fold_range_test optimizes
3107    it on trees.  The tree code for the binary
3108    operation between all the operands is OPCODE.
3109    If OPCODE is ERROR_MARK, optimize_range_tests is called from within
3110    maybe_optimize_range_tests for inter-bb range optimization.
3111    In that case if oe->op is NULL, oe->id is bb->index whose
3112    GIMPLE_COND is && or ||ed into the test, and oe->rank says
3113    the actual opcode.  */
3114
3115 static bool
3116 optimize_range_tests (enum tree_code opcode,
3117                       vec<operand_entry *> *ops)
3118 {
3119   unsigned int length = ops->length (), i, j, first;
3120   operand_entry *oe;
3121   struct range_entry *ranges;
3122   bool any_changes = false;
3123
3124   if (length == 1)
3125     return false;
3126
3127   ranges = XNEWVEC (struct range_entry, length);
3128   for (i = 0; i < length; i++)
3129     {
3130       oe = (*ops)[i];
3131       ranges[i].idx = i;
3132       init_range_entry (ranges + i, oe->op,
3133                         oe->op
3134                         ? NULL
3135                         : last_stmt (BASIC_BLOCK_FOR_FN (cfun, oe->id)));
3136       /* For | invert it now, we will invert it again before emitting
3137          the optimized expression.  */
3138       if (opcode == BIT_IOR_EXPR
3139           || (opcode == ERROR_MARK && oe->rank == BIT_IOR_EXPR))
3140         ranges[i].in_p = !ranges[i].in_p;
3141     }
3142
3143   qsort (ranges, length, sizeof (*ranges), range_entry_cmp);
3144   for (i = 0; i < length; i++)
3145     if (ranges[i].exp != NULL_TREE && TREE_CODE (ranges[i].exp) == SSA_NAME)
3146       break;
3147
3148   /* Try to merge ranges.  */
3149   for (first = i; i < length; i++)
3150     {
3151       tree low = ranges[i].low;
3152       tree high = ranges[i].high;
3153       int in_p = ranges[i].in_p;
3154       bool strict_overflow_p = ranges[i].strict_overflow_p;
3155       int update_fail_count = 0;
3156
3157       for (j = i + 1; j < length; j++)
3158         {
3159           if (ranges[i].exp != ranges[j].exp)
3160             break;
3161           if (!merge_ranges (&in_p, &low, &high, in_p, low, high,
3162                              ranges[j].in_p, ranges[j].low, ranges[j].high))
3163             break;
3164           strict_overflow_p |= ranges[j].strict_overflow_p;
3165         }
3166
3167       if (j == i + 1)
3168         continue;
3169
3170       if (update_range_test (ranges + i, ranges + i + 1, NULL, j - i - 1,
3171                              opcode, ops, ranges[i].exp, NULL, in_p,
3172                              low, high, strict_overflow_p))
3173         {
3174           i = j - 1;
3175           any_changes = true;
3176         }
3177       /* Avoid quadratic complexity if all merge_ranges calls would succeed,
3178          while update_range_test would fail.  */
3179       else if (update_fail_count == 64)
3180         i = j - 1;
3181       else
3182         ++update_fail_count;
3183     }
3184
3185   any_changes |= optimize_range_tests_1 (opcode, first, length, true,
3186                                          ops, ranges);
3187
3188   if (BRANCH_COST (optimize_function_for_speed_p (cfun), false) >= 2)
3189     any_changes |= optimize_range_tests_1 (opcode, first, length, false,
3190                                            ops, ranges);
3191   if (lshift_cheap_p (optimize_function_for_speed_p (cfun)))
3192     any_changes |= optimize_range_tests_to_bit_test (opcode, first, length,
3193                                                      ops, ranges);
3194   any_changes |= optimize_range_tests_var_bound (opcode, first, length, ops,
3195                                                  ranges);
3196
3197   if (any_changes && opcode != ERROR_MARK)
3198     {
3199       j = 0;
3200       FOR_EACH_VEC_ELT (*ops, i, oe)
3201         {
3202           if (oe->op == error_mark_node)
3203             continue;
3204           else if (i != j)
3205             (*ops)[j] = oe;
3206           j++;
3207         }
3208       ops->truncate (j);
3209     }
3210
3211   XDELETEVEC (ranges);
3212   return any_changes;
3213 }
3214
3215 /* A subroutine of optimize_vec_cond_expr to extract and canonicalize
3216    the operands of the VEC_COND_EXPR.  Returns ERROR_MARK on failure,
3217    otherwise the comparison code.  */
3218
3219 static tree_code
3220 ovce_extract_ops (tree var, gassign **rets, bool *reti)
3221 {
3222   if (TREE_CODE (var) != SSA_NAME)
3223     return ERROR_MARK;
3224
3225   gassign *stmt = dyn_cast <gassign *> (SSA_NAME_DEF_STMT (var));
3226   if (stmt == NULL)
3227     return ERROR_MARK;
3228
3229   /* ??? If we start creating more COND_EXPR, we could perform
3230      this same optimization with them.  For now, simplify.  */
3231   if (gimple_assign_rhs_code (stmt) != VEC_COND_EXPR)
3232     return ERROR_MARK;
3233
3234   tree cond = gimple_assign_rhs1 (stmt);
3235   tree_code cmp = TREE_CODE (cond);
3236   if (TREE_CODE_CLASS (cmp) != tcc_comparison)
3237     return ERROR_MARK;
3238
3239   /* ??? For now, allow only canonical true and false result vectors.
3240      We could expand this to other constants should the need arise,
3241      but at the moment we don't create them.  */
3242   tree t = gimple_assign_rhs2 (stmt);
3243   tree f = gimple_assign_rhs3 (stmt);
3244   bool inv;
3245   if (integer_all_onesp (t))
3246     inv = false;
3247   else if (integer_all_onesp (f))
3248     {
3249       cmp = invert_tree_comparison (cmp, false);
3250       inv = true;
3251     }
3252   else
3253     return ERROR_MARK;
3254   if (!integer_zerop (f))
3255     return ERROR_MARK;
3256
3257   /* Success!  */
3258   if (rets)
3259     *rets = stmt;
3260   if (reti)
3261     *reti = inv;
3262   return cmp;
3263 }
3264
3265 /* Optimize the condition of VEC_COND_EXPRs which have been combined
3266    with OPCODE (either BIT_AND_EXPR or BIT_IOR_EXPR).  */
3267
3268 static bool
3269 optimize_vec_cond_expr (tree_code opcode, vec<operand_entry *> *ops)
3270 {
3271   unsigned int length = ops->length (), i, j;
3272   bool any_changes = false;
3273
3274   if (length == 1)
3275     return false;
3276
3277   for (i = 0; i < length; ++i)
3278     {
3279       tree elt0 = (*ops)[i]->op;
3280
3281       gassign *stmt0;
3282       bool invert;
3283       tree_code cmp0 = ovce_extract_ops (elt0, &stmt0, &invert);
3284       if (cmp0 == ERROR_MARK)
3285         continue;
3286
3287       for (j = i + 1; j < length; ++j)
3288         {
3289           tree &elt1 = (*ops)[j]->op;
3290
3291           gassign *stmt1;
3292           tree_code cmp1 = ovce_extract_ops (elt1, &stmt1, NULL);
3293           if (cmp1 == ERROR_MARK)
3294             continue;
3295
3296           tree cond0 = gimple_assign_rhs1 (stmt0);
3297           tree x0 = TREE_OPERAND (cond0, 0);
3298           tree y0 = TREE_OPERAND (cond0, 1);
3299
3300           tree cond1 = gimple_assign_rhs1 (stmt1);
3301           tree x1 = TREE_OPERAND (cond1, 0);
3302           tree y1 = TREE_OPERAND (cond1, 1);
3303
3304           tree comb;
3305           if (opcode == BIT_AND_EXPR)
3306             comb = maybe_fold_and_comparisons (cmp0, x0, y0, cmp1, x1, y1);
3307           else if (opcode == BIT_IOR_EXPR)
3308             comb = maybe_fold_or_comparisons (cmp0, x0, y0, cmp1, x1, y1);
3309           else
3310             gcc_unreachable ();
3311           if (comb == NULL)
3312             continue;
3313
3314           /* Success! */
3315           if (dump_file && (dump_flags & TDF_DETAILS))
3316             {
3317               fprintf (dump_file, "Transforming ");
3318               print_generic_expr (dump_file, cond0);
3319               fprintf (dump_file, " %c ", opcode == BIT_AND_EXPR ? '&' : '|');
3320               print_generic_expr (dump_file, cond1);
3321               fprintf (dump_file, " into ");
3322               print_generic_expr (dump_file, comb);
3323               fputc ('\n', dump_file);
3324             }
3325
3326           gimple_assign_set_rhs1 (stmt0, comb);
3327           if (invert)
3328             std::swap (*gimple_assign_rhs2_ptr (stmt0),
3329                        *gimple_assign_rhs3_ptr (stmt0));
3330           update_stmt (stmt0);
3331
3332           elt1 = error_mark_node;
3333           any_changes = true;
3334         }
3335     }
3336
3337   if (any_changes)
3338     {
3339       operand_entry *oe;
3340       j = 0;
3341       FOR_EACH_VEC_ELT (*ops, i, oe)
3342         {
3343           if (oe->op == error_mark_node)
3344             continue;
3345           else if (i != j)
3346             (*ops)[j] = oe;
3347           j++;
3348         }
3349       ops->truncate (j);
3350     }
3351
3352   return any_changes;
3353 }
3354
3355 /* Return true if STMT is a cast like:
3356    <bb N>:
3357    ...
3358    _123 = (int) _234;
3359
3360    <bb M>:
3361    # _345 = PHI <_123(N), 1(...), 1(...)>
3362    where _234 has bool type, _123 has single use and
3363    bb N has a single successor M.  This is commonly used in
3364    the last block of a range test.
3365
3366    Also Return true if STMT is tcc_compare like:
3367    <bb N>:
3368    ...
3369    _234 = a_2(D) == 2;
3370
3371    <bb M>:
3372    # _345 = PHI <_234(N), 1(...), 1(...)>
3373    _346 = (int) _345;
3374    where _234 has booltype, single use and
3375    bb N has a single successor M.  This is commonly used in
3376    the last block of a range test.  */
3377
3378 static bool
3379 final_range_test_p (gimple *stmt)
3380 {
3381   basic_block bb, rhs_bb, lhs_bb;
3382   edge e;
3383   tree lhs, rhs;
3384   use_operand_p use_p;
3385   gimple *use_stmt;
3386
3387   if (!gimple_assign_cast_p (stmt)
3388       && (!is_gimple_assign (stmt)
3389           || (TREE_CODE_CLASS (gimple_assign_rhs_code (stmt))
3390               != tcc_comparison)))
3391     return false;
3392   bb = gimple_bb (stmt);
3393   if (!single_succ_p (bb))
3394     return false;
3395   e = single_succ_edge (bb);
3396   if (e->flags & EDGE_COMPLEX)
3397     return false;
3398
3399   lhs = gimple_assign_lhs (stmt);
3400   rhs = gimple_assign_rhs1 (stmt);
3401   if (gimple_assign_cast_p (stmt)
3402       && (!INTEGRAL_TYPE_P (TREE_TYPE (lhs))
3403           || TREE_CODE (rhs) != SSA_NAME
3404           || TREE_CODE (TREE_TYPE (rhs)) != BOOLEAN_TYPE))
3405     return false;
3406
3407   if (!gimple_assign_cast_p (stmt)
3408       && (TREE_CODE (TREE_TYPE (lhs)) != BOOLEAN_TYPE))
3409       return false;
3410
3411   /* Test whether lhs is consumed only by a PHI in the only successor bb.  */
3412   if (!single_imm_use (lhs, &use_p, &use_stmt))
3413     return false;
3414
3415   if (gimple_code (use_stmt) != GIMPLE_PHI
3416       || gimple_bb (use_stmt) != e->dest)
3417     return false;
3418
3419   /* And that the rhs is defined in the same loop.  */
3420   if (gimple_assign_cast_p (stmt))
3421     {
3422       if (TREE_CODE (rhs) != SSA_NAME
3423           || !(rhs_bb = gimple_bb (SSA_NAME_DEF_STMT (rhs)))
3424           || !flow_bb_inside_loop_p (loop_containing_stmt (stmt), rhs_bb))
3425         return false;
3426     }
3427   else
3428     {
3429       if (TREE_CODE (lhs) != SSA_NAME
3430           || !(lhs_bb = gimple_bb (SSA_NAME_DEF_STMT (lhs)))
3431           || !flow_bb_inside_loop_p (loop_containing_stmt (stmt), lhs_bb))
3432         return false;
3433     }
3434
3435   return true;
3436 }
3437
3438 /* Return true if BB is suitable basic block for inter-bb range test
3439    optimization.  If BACKWARD is true, BB should be the only predecessor
3440    of TEST_BB, and *OTHER_BB is either NULL and filled by the routine,
3441    or compared with to find a common basic block to which all conditions
3442    branch to if true resp. false.  If BACKWARD is false, TEST_BB should
3443    be the only predecessor of BB.  */
3444
3445 static bool
3446 suitable_cond_bb (basic_block bb, basic_block test_bb, basic_block *other_bb,
3447                   bool backward)
3448 {
3449   edge_iterator ei, ei2;
3450   edge e, e2;
3451   gimple *stmt;
3452   gphi_iterator gsi;
3453   bool other_edge_seen = false;
3454   bool is_cond;
3455
3456   if (test_bb == bb)
3457     return false;
3458   /* Check last stmt first.  */
3459   stmt = last_stmt (bb);
3460   if (stmt == NULL
3461       || (gimple_code (stmt) != GIMPLE_COND
3462           && (backward || !final_range_test_p (stmt)))
3463       || gimple_visited_p (stmt)
3464       || stmt_could_throw_p (stmt)
3465       || *other_bb == bb)
3466     return false;
3467   is_cond = gimple_code (stmt) == GIMPLE_COND;
3468   if (is_cond)
3469     {
3470       /* If last stmt is GIMPLE_COND, verify that one of the succ edges
3471          goes to the next bb (if BACKWARD, it is TEST_BB), and the other
3472          to *OTHER_BB (if not set yet, try to find it out).  */
3473       if (EDGE_COUNT (bb->succs) != 2)
3474         return false;
3475       FOR_EACH_EDGE (e, ei, bb->succs)
3476         {
3477           if (!(e->flags & (EDGE_TRUE_VALUE | EDGE_FALSE_VALUE)))
3478             return false;
3479           if (e->dest == test_bb)
3480             {
3481               if (backward)
3482                 continue;
3483               else
3484                 return false;
3485             }
3486           if (e->dest == bb)
3487             return false;
3488           if (*other_bb == NULL)
3489             {
3490               FOR_EACH_EDGE (e2, ei2, test_bb->succs)
3491                 if (!(e2->flags & (EDGE_TRUE_VALUE | EDGE_FALSE_VALUE)))
3492                   return false;
3493                 else if (e->dest == e2->dest)
3494                   *other_bb = e->dest;
3495               if (*other_bb == NULL)
3496                 return false;
3497             }
3498           if (e->dest == *other_bb)
3499             other_edge_seen = true;
3500           else if (backward)
3501             return false;
3502         }
3503       if (*other_bb == NULL || !other_edge_seen)
3504         return false;
3505     }
3506   else if (single_succ (bb) != *other_bb)
3507     return false;
3508
3509   /* Now check all PHIs of *OTHER_BB.  */
3510   e = find_edge (bb, *other_bb);
3511   e2 = find_edge (test_bb, *other_bb);
3512   for (gsi = gsi_start_phis (e->dest); !gsi_end_p (gsi); gsi_next (&gsi))
3513     {
3514       gphi *phi = gsi.phi ();
3515       /* If both BB and TEST_BB end with GIMPLE_COND, all PHI arguments
3516          corresponding to BB and TEST_BB predecessor must be the same.  */
3517       if (!operand_equal_p (gimple_phi_arg_def (phi, e->dest_idx),
3518                             gimple_phi_arg_def (phi, e2->dest_idx), 0))
3519         {
3520           /* Otherwise, if one of the blocks doesn't end with GIMPLE_COND,
3521              one of the PHIs should have the lhs of the last stmt in
3522              that block as PHI arg and that PHI should have 0 or 1
3523              corresponding to it in all other range test basic blocks
3524              considered.  */
3525           if (!is_cond)
3526             {
3527               if (gimple_phi_arg_def (phi, e->dest_idx)
3528                   == gimple_assign_lhs (stmt)
3529                   && (integer_zerop (gimple_phi_arg_def (phi, e2->dest_idx))
3530                       || integer_onep (gimple_phi_arg_def (phi,
3531                                                            e2->dest_idx))))
3532                 continue;
3533             }
3534           else
3535             {
3536               gimple *test_last = last_stmt (test_bb);
3537               if (gimple_code (test_last) != GIMPLE_COND
3538                   && gimple_phi_arg_def (phi, e2->dest_idx)
3539                      == gimple_assign_lhs (test_last)
3540                   && (integer_zerop (gimple_phi_arg_def (phi, e->dest_idx))
3541                       || integer_onep (gimple_phi_arg_def (phi, e->dest_idx))))
3542                 continue;
3543             }
3544
3545           return false;
3546         }
3547     }
3548   return true;
3549 }
3550
3551 /* Return true if BB doesn't have side-effects that would disallow
3552    range test optimization, all SSA_NAMEs set in the bb are consumed
3553    in the bb and there are no PHIs.  */
3554
3555 static bool
3556 no_side_effect_bb (basic_block bb)
3557 {
3558   gimple_stmt_iterator gsi;
3559   gimple *last;
3560
3561   if (!gimple_seq_empty_p (phi_nodes (bb)))
3562     return false;
3563   last = last_stmt (bb);
3564   for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
3565     {
3566       gimple *stmt = gsi_stmt (gsi);
3567       tree lhs;
3568       imm_use_iterator imm_iter;
3569       use_operand_p use_p;
3570
3571       if (is_gimple_debug (stmt))
3572         continue;
3573       if (gimple_has_side_effects (stmt))
3574         return false;
3575       if (stmt == last)
3576         return true;
3577       if (!is_gimple_assign (stmt))
3578         return false;
3579       lhs = gimple_assign_lhs (stmt);
3580       if (TREE_CODE (lhs) != SSA_NAME)
3581         return false;
3582       if (gimple_assign_rhs_could_trap_p (stmt))
3583         return false;
3584       FOR_EACH_IMM_USE_FAST (use_p, imm_iter, lhs)
3585         {
3586           gimple *use_stmt = USE_STMT (use_p);
3587           if (is_gimple_debug (use_stmt))
3588             continue;
3589           if (gimple_bb (use_stmt) != bb)
3590             return false;
3591         }
3592     }
3593   return false;
3594 }
3595
3596 /* If VAR is set by CODE (BIT_{AND,IOR}_EXPR) which is reassociable,
3597    return true and fill in *OPS recursively.  */
3598
3599 static bool
3600 get_ops (tree var, enum tree_code code, vec<operand_entry *> *ops,
3601          struct loop *loop)
3602 {
3603   gimple *stmt = SSA_NAME_DEF_STMT (var);
3604   tree rhs[2];
3605   int i;
3606
3607   if (!is_reassociable_op (stmt, code, loop))
3608     return false;
3609
3610   rhs[0] = gimple_assign_rhs1 (stmt);
3611   rhs[1] = gimple_assign_rhs2 (stmt);
3612   gimple_set_visited (stmt, true);
3613   for (i = 0; i < 2; i++)
3614     if (TREE_CODE (rhs[i]) == SSA_NAME
3615         && !get_ops (rhs[i], code, ops, loop)
3616         && has_single_use (rhs[i]))
3617       {
3618         operand_entry *oe = operand_entry_pool.allocate ();
3619
3620         oe->op = rhs[i];
3621         oe->rank = code;
3622         oe->id = 0;
3623         oe->count = 1;
3624         oe->stmt_to_insert = NULL;
3625         ops->safe_push (oe);
3626       }
3627   return true;
3628 }
3629
3630 /* Find the ops that were added by get_ops starting from VAR, see if
3631    they were changed during update_range_test and if yes, create new
3632    stmts.  */
3633
3634 static tree
3635 update_ops (tree var, enum tree_code code, vec<operand_entry *> ops,
3636             unsigned int *pidx, struct loop *loop)
3637 {
3638   gimple *stmt = SSA_NAME_DEF_STMT (var);
3639   tree rhs[4];
3640   int i;
3641
3642   if (!is_reassociable_op (stmt, code, loop))
3643     return NULL;
3644
3645   rhs[0] = gimple_assign_rhs1 (stmt);
3646   rhs[1] = gimple_assign_rhs2 (stmt);
3647   rhs[2] = rhs[0];
3648   rhs[3] = rhs[1];
3649   for (i = 0; i < 2; i++)
3650     if (TREE_CODE (rhs[i]) == SSA_NAME)
3651       {
3652         rhs[2 + i] = update_ops (rhs[i], code, ops, pidx, loop);
3653         if (rhs[2 + i] == NULL_TREE)
3654           {
3655             if (has_single_use (rhs[i]))
3656               rhs[2 + i] = ops[(*pidx)++]->op;
3657             else
3658               rhs[2 + i] = rhs[i];
3659           }
3660       }
3661   if ((rhs[2] != rhs[0] || rhs[3] != rhs[1])
3662       && (rhs[2] != rhs[1] || rhs[3] != rhs[0]))
3663     {
3664       gimple_stmt_iterator gsi = gsi_for_stmt (stmt);
3665       var = make_ssa_name (TREE_TYPE (var));
3666       gassign *g = gimple_build_assign (var, gimple_assign_rhs_code (stmt),
3667                                         rhs[2], rhs[3]);
3668       gimple_set_uid (g, gimple_uid (stmt));
3669       gimple_set_visited (g, true);
3670       gsi_insert_before (&gsi, g, GSI_SAME_STMT);
3671     }
3672   return var;
3673 }
3674
3675 /* Structure to track the initial value passed to get_ops and
3676    the range in the ops vector for each basic block.  */
3677
3678 struct inter_bb_range_test_entry
3679 {
3680   tree op;
3681   unsigned int first_idx, last_idx;
3682 };
3683
3684 /* Inter-bb range test optimization.
3685
3686    Returns TRUE if a gimple conditional is optimized to a true/false,
3687    otherwise return FALSE.
3688
3689    This indicates to the caller that it should run a CFG cleanup pass
3690    once reassociation is completed.  */
3691
3692 static bool
3693 maybe_optimize_range_tests (gimple *stmt)
3694 {
3695   basic_block first_bb = gimple_bb (stmt);
3696   basic_block last_bb = first_bb;
3697   basic_block other_bb = NULL;
3698   basic_block bb;
3699   edge_iterator ei;
3700   edge e;
3701   auto_vec<operand_entry *> ops;
3702   auto_vec<inter_bb_range_test_entry> bbinfo;
3703   bool any_changes = false;
3704   bool cfg_cleanup_needed = false;
3705
3706   /* Consider only basic blocks that end with GIMPLE_COND or
3707      a cast statement satisfying final_range_test_p.  All
3708      but the last bb in the first_bb .. last_bb range
3709      should end with GIMPLE_COND.  */
3710   if (gimple_code (stmt) == GIMPLE_COND)
3711     {
3712       if (EDGE_COUNT (first_bb->succs) != 2)
3713         return cfg_cleanup_needed;
3714     }
3715   else if (final_range_test_p (stmt))
3716     other_bb = single_succ (first_bb);
3717   else
3718     return cfg_cleanup_needed;
3719
3720   if (stmt_could_throw_p (stmt))
3721     return cfg_cleanup_needed;
3722
3723   /* As relative ordering of post-dominator sons isn't fixed,
3724      maybe_optimize_range_tests can be called first on any
3725      bb in the range we want to optimize.  So, start searching
3726      backwards, if first_bb can be set to a predecessor.  */
3727   while (single_pred_p (first_bb))
3728     {
3729       basic_block pred_bb = single_pred (first_bb);
3730       if (!suitable_cond_bb (pred_bb, first_bb, &other_bb, true))
3731         break;
3732       if (!no_side_effect_bb (first_bb))
3733         break;
3734       first_bb = pred_bb;
3735     }
3736   /* If first_bb is last_bb, other_bb hasn't been computed yet.
3737      Before starting forward search in last_bb successors, find
3738      out the other_bb.  */
3739   if (first_bb == last_bb)
3740     {
3741       other_bb = NULL;
3742       /* As non-GIMPLE_COND last stmt always terminates the range,
3743          if forward search didn't discover anything, just give up.  */
3744       if (gimple_code (stmt) != GIMPLE_COND)
3745         return cfg_cleanup_needed;
3746       /* Look at both successors.  Either it ends with a GIMPLE_COND
3747          and satisfies suitable_cond_bb, or ends with a cast and
3748          other_bb is that cast's successor.  */
3749       FOR_EACH_EDGE (e, ei, first_bb->succs)
3750         if (!(e->flags & (EDGE_TRUE_VALUE | EDGE_FALSE_VALUE))
3751             || e->dest == first_bb)
3752           return cfg_cleanup_needed;
3753         else if (single_pred_p (e->dest))
3754           {
3755             stmt = last_stmt (e->dest);
3756             if (stmt
3757                 && gimple_code (stmt) == GIMPLE_COND
3758                 && EDGE_COUNT (e->dest->succs) == 2)
3759               {
3760                 if (suitable_cond_bb (first_bb, e->dest, &other_bb, true))
3761                   break;
3762                 else
3763                   other_bb = NULL;
3764               }
3765             else if (stmt
3766                      && final_range_test_p (stmt)
3767                      && find_edge (first_bb, single_succ (e->dest)))
3768               {
3769                 other_bb = single_succ (e->dest);
3770                 if (other_bb == first_bb)
3771                   other_bb = NULL;
3772               }
3773           }
3774       if (other_bb == NULL)
3775         return cfg_cleanup_needed;
3776     }
3777   /* Now do the forward search, moving last_bb to successor bbs
3778      that aren't other_bb.  */
3779   while (EDGE_COUNT (last_bb->succs) == 2)
3780     {
3781       FOR_EACH_EDGE (e, ei, last_bb->succs)
3782         if (e->dest != other_bb)
3783           break;
3784       if (e == NULL)
3785         break;
3786       if (!single_pred_p (e->dest))
3787         break;
3788       if (!suitable_cond_bb (e->dest, last_bb, &other_bb, false))
3789         break;
3790       if (!no_side_effect_bb (e->dest))
3791         break;
3792       last_bb = e->dest;
3793     }
3794   if (first_bb == last_bb)
3795     return cfg_cleanup_needed;
3796   /* Here basic blocks first_bb through last_bb's predecessor
3797      end with GIMPLE_COND, all of them have one of the edges to
3798      other_bb and another to another block in the range,
3799      all blocks except first_bb don't have side-effects and
3800      last_bb ends with either GIMPLE_COND, or cast satisfying
3801      final_range_test_p.  */
3802   for (bb = last_bb; ; bb = single_pred (bb))
3803     {
3804       enum tree_code code;
3805       tree lhs, rhs;
3806       inter_bb_range_test_entry bb_ent;
3807
3808       bb_ent.op = NULL_TREE;
3809       bb_ent.first_idx = ops.length ();
3810       bb_ent.last_idx = bb_ent.first_idx;
3811       e = find_edge (bb, other_bb);
3812       stmt = last_stmt (bb);
3813       gimple_set_visited (stmt, true);
3814       if (gimple_code (stmt) != GIMPLE_COND)
3815         {
3816           use_operand_p use_p;
3817           gimple *phi;
3818           edge e2;
3819           unsigned int d;
3820
3821           lhs = gimple_assign_lhs (stmt);
3822           rhs = gimple_assign_rhs1 (stmt);
3823           gcc_assert (bb == last_bb);
3824
3825           /* stmt is
3826              _123 = (int) _234;
3827              OR
3828              _234 = a_2(D) == 2;
3829
3830              followed by:
3831              <bb M>:
3832              # _345 = PHI <_123(N), 1(...), 1(...)>
3833
3834              or 0 instead of 1.  If it is 0, the _234
3835              range test is anded together with all the
3836              other range tests, if it is 1, it is ored with
3837              them.  */
3838           single_imm_use (lhs, &use_p, &phi);
3839           gcc_assert (gimple_code (phi) == GIMPLE_PHI);
3840           e2 = find_edge (first_bb, other_bb);
3841           d = e2->dest_idx;
3842           gcc_assert (gimple_phi_arg_def (phi, e->dest_idx) == lhs);
3843           if (integer_zerop (gimple_phi_arg_def (phi, d)))
3844             code = BIT_AND_EXPR;
3845           else
3846             {
3847               gcc_checking_assert (integer_onep (gimple_phi_arg_def (phi, d)));
3848               code = BIT_IOR_EXPR;
3849             }
3850
3851           /* If _234 SSA_NAME_DEF_STMT is
3852              _234 = _567 | _789;
3853              (or &, corresponding to 1/0 in the phi arguments,
3854              push into ops the individual range test arguments
3855              of the bitwise or resp. and, recursively.  */
3856           if (TREE_CODE (rhs) == SSA_NAME
3857               && (TREE_CODE_CLASS (gimple_assign_rhs_code (stmt))
3858                   != tcc_comparison)
3859               && !get_ops (rhs, code, &ops,
3860                         loop_containing_stmt (stmt))
3861               && has_single_use (rhs))
3862             {
3863               /* Otherwise, push the _234 range test itself.  */
3864               operand_entry *oe = operand_entry_pool.allocate ();
3865
3866               oe->op = rhs;
3867               oe->rank = code;
3868               oe->id = 0;
3869               oe->count = 1;
3870               oe->stmt_to_insert = NULL;
3871               ops.safe_push (oe);
3872               bb_ent.last_idx++;
3873               bb_ent.op = rhs;
3874             }
3875           else if (is_gimple_assign (stmt)
3876                    && (TREE_CODE_CLASS (gimple_assign_rhs_code (stmt))
3877                        == tcc_comparison)
3878                    && !get_ops (lhs, code, &ops,
3879                                 loop_containing_stmt (stmt))
3880                    && has_single_use (lhs))
3881             {
3882               operand_entry *oe = operand_entry_pool.allocate ();
3883               oe->op = lhs;
3884               oe->rank = code;
3885               oe->id = 0;
3886               oe->count = 1;
3887               ops.safe_push (oe);
3888               bb_ent.last_idx++;
3889               bb_ent.op = lhs;
3890             }
3891           else
3892             {
3893               bb_ent.last_idx = ops.length ();
3894               bb_ent.op = rhs;
3895             }
3896           bbinfo.safe_push (bb_ent);
3897           continue;
3898         }
3899       /* Otherwise stmt is GIMPLE_COND.  */
3900       code = gimple_cond_code (stmt);
3901       lhs = gimple_cond_lhs (stmt);
3902       rhs = gimple_cond_rhs (stmt);
3903       if (TREE_CODE (lhs) == SSA_NAME
3904           && INTEGRAL_TYPE_P (TREE_TYPE (lhs))
3905           && ((code != EQ_EXPR && code != NE_EXPR)
3906               || rhs != boolean_false_node
3907                  /* Either push into ops the individual bitwise
3908                     or resp. and operands, depending on which
3909                     edge is other_bb.  */
3910               || !get_ops (lhs, (((e->flags & EDGE_TRUE_VALUE) == 0)
3911                                  ^ (code == EQ_EXPR))
3912                                 ? BIT_AND_EXPR : BIT_IOR_EXPR, &ops,
3913                            loop_containing_stmt (stmt))))
3914         {
3915           /* Or push the GIMPLE_COND stmt itself.  */
3916           operand_entry *oe = operand_entry_pool.allocate ();
3917
3918           oe->op = NULL;
3919           oe->rank = (e->flags & EDGE_TRUE_VALUE)
3920                      ? BIT_IOR_EXPR : BIT_AND_EXPR;
3921           /* oe->op = NULL signs that there is no SSA_NAME
3922              for the range test, and oe->id instead is the
3923              basic block number, at which's end the GIMPLE_COND
3924              is.  */
3925           oe->id = bb->index;
3926           oe->count = 1;
3927           oe->stmt_to_insert = NULL;
3928           ops.safe_push (oe);
3929           bb_ent.op = NULL;
3930           bb_ent.last_idx++;
3931         }
3932       else if (ops.length () > bb_ent.first_idx)
3933         {
3934           bb_ent.op = lhs;
3935           bb_ent.last_idx = ops.length ();
3936         }
3937       bbinfo.safe_push (bb_ent);
3938       if (bb == first_bb)
3939         break;
3940     }
3941   if (ops.length () > 1)
3942     any_changes = optimize_range_tests (ERROR_MARK, &ops);
3943   if (any_changes)
3944     {
3945       unsigned int idx, max_idx = 0;
3946       /* update_ops relies on has_single_use predicates returning the
3947          same values as it did during get_ops earlier.  Additionally it
3948          never removes statements, only adds new ones and it should walk
3949          from the single imm use and check the predicate already before
3950          making those changes.
3951          On the other side, the handling of GIMPLE_COND directly can turn
3952          previously multiply used SSA_NAMEs into single use SSA_NAMEs, so
3953          it needs to be done in a separate loop afterwards.  */
3954       for (bb = last_bb, idx = 0; ; bb = single_pred (bb), idx++)
3955         {
3956           if (bbinfo[idx].first_idx < bbinfo[idx].last_idx
3957               && bbinfo[idx].op != NULL_TREE)
3958             {
3959               tree new_op;
3960
3961               max_idx = idx;
3962               stmt = last_stmt (bb);
3963               new_op = update_ops (bbinfo[idx].op,
3964                                    (enum tree_code)
3965                                    ops[bbinfo[idx].first_idx]->rank,
3966                                    ops, &bbinfo[idx].first_idx,
3967                                    loop_containing_stmt (stmt));
3968               if (new_op == NULL_TREE)
3969                 {
3970                   gcc_assert (bb == last_bb);
3971                   new_op = ops[bbinfo[idx].first_idx++]->op;
3972                 }
3973               if (bbinfo[idx].op != new_op)
3974                 {
3975                   imm_use_iterator iter;
3976                   use_operand_p use_p;
3977                   gimple *use_stmt, *cast_or_tcc_cmp_stmt = NULL;
3978
3979                   FOR_EACH_IMM_USE_STMT (use_stmt, iter, bbinfo[idx].op)
3980                     if (is_gimple_debug (use_stmt))
3981                       continue;
3982                     else if (gimple_code (use_stmt) == GIMPLE_COND
3983                              || gimple_code (use_stmt) == GIMPLE_PHI)
3984                       FOR_EACH_IMM_USE_ON_STMT (use_p, iter)
3985                         SET_USE (use_p, new_op);
3986                     else if ((is_gimple_assign (use_stmt)
3987                               && (TREE_CODE_CLASS
3988                                   (gimple_assign_rhs_code (use_stmt))
3989                                   == tcc_comparison)))
3990                       cast_or_tcc_cmp_stmt = use_stmt;
3991                     else if (gimple_assign_cast_p (use_stmt))
3992                       cast_or_tcc_cmp_stmt = use_stmt;
3993                     else
3994                       gcc_unreachable ();
3995
3996                   if (cast_or_tcc_cmp_stmt)
3997                     {
3998                       gcc_assert (bb == last_bb);
3999                       tree lhs = gimple_assign_lhs (cast_or_tcc_cmp_stmt);
4000                       tree new_lhs = make_ssa_name (TREE_TYPE (lhs));
4001                       enum tree_code rhs_code
4002                         = gimple_assign_cast_p (cast_or_tcc_cmp_stmt)
4003                         ? gimple_assign_rhs_code (cast_or_tcc_cmp_stmt)
4004                         : CONVERT_EXPR;
4005                       gassign *g;
4006                       if (is_gimple_min_invariant (new_op))
4007                         {
4008                           new_op = fold_convert (TREE_TYPE (lhs), new_op);
4009                           g = gimple_build_assign (new_lhs, new_op);
4010                         }
4011                       else
4012                         g = gimple_build_assign (new_lhs, rhs_code, new_op);
4013                       gimple_stmt_iterator gsi
4014                         = gsi_for_stmt (cast_or_tcc_cmp_stmt);
4015                       gimple_set_uid (g, gimple_uid (cast_or_tcc_cmp_stmt));
4016                       gimple_set_visited (g, true);
4017                       gsi_insert_before (&gsi, g, GSI_SAME_STMT);
4018                       FOR_EACH_IMM_USE_STMT (use_stmt, iter, lhs)
4019                         if (is_gimple_debug (use_stmt))
4020                           continue;
4021                         else if (gimple_code (use_stmt) == GIMPLE_COND
4022                                  || gimple_code (use_stmt) == GIMPLE_PHI)
4023                           FOR_EACH_IMM_USE_ON_STMT (use_p, iter)
4024                             SET_USE (use_p, new_lhs);
4025                         else
4026                           gcc_unreachable ();
4027                     }
4028                 }
4029             }
4030           if (bb == first_bb)
4031             break;
4032         }
4033       for (bb = last_bb, idx = 0; ; bb = single_pred (bb), idx++)
4034         {
4035           if (bbinfo[idx].first_idx < bbinfo[idx].last_idx
4036               && bbinfo[idx].op == NULL_TREE
4037               && ops[bbinfo[idx].first_idx]->op != NULL_TREE)
4038             {
4039               gcond *cond_stmt = as_a <gcond *> (last_stmt (bb));
4040
4041               if (idx > max_idx)
4042                 max_idx = idx;
4043
4044               /* If we collapse the conditional to a true/false
4045                  condition, then bubble that knowledge up to our caller.  */
4046               if (integer_zerop (ops[bbinfo[idx].first_idx]->op))
4047                 {
4048                   gimple_cond_make_false (cond_stmt);
4049                   cfg_cleanup_needed = true;
4050                 }
4051               else if (integer_onep (ops[bbinfo[idx].first_idx]->op))
4052                 {
4053                   gimple_cond_make_true (cond_stmt);
4054                   cfg_cleanup_needed = true;
4055                 }
4056               else
4057                 {
4058                   gimple_cond_set_code (cond_stmt, NE_EXPR);
4059                   gimple_cond_set_lhs (cond_stmt,
4060                                        ops[bbinfo[idx].first_idx]->op);
4061                   gimple_cond_set_rhs (cond_stmt, boolean_false_node);
4062                 }
4063               update_stmt (cond_stmt);
4064             }
4065           if (bb == first_bb)
4066             break;
4067         }
4068
4069       /* The above changes could result in basic blocks after the first
4070          modified one, up to and including last_bb, to be executed even if
4071          they would not be in the original program.  If the value ranges of
4072          assignment lhs' in those bbs were dependent on the conditions
4073          guarding those basic blocks which now can change, the VRs might
4074          be incorrect.  As no_side_effect_bb should ensure those SSA_NAMEs
4075          are only used within the same bb, it should be not a big deal if
4076          we just reset all the VRs in those bbs.  See PR68671.  */
4077       for (bb = last_bb, idx = 0; idx < max_idx; bb = single_pred (bb), idx++)
4078         reset_flow_sensitive_info_in_bb (bb);
4079     }
4080   return cfg_cleanup_needed;
4081 }
4082
4083 /* Return true if OPERAND is defined by a PHI node which uses the LHS
4084    of STMT in it's operands.  This is also known as a "destructive
4085    update" operation.  */
4086
4087 static bool
4088 is_phi_for_stmt (gimple *stmt, tree operand)
4089 {
4090   gimple *def_stmt;
4091   gphi *def_phi;
4092   tree lhs;
4093   use_operand_p arg_p;
4094   ssa_op_iter i;
4095
4096   if (TREE_CODE (operand) != SSA_NAME)
4097     return false;
4098
4099   lhs = gimple_assign_lhs (stmt);
4100
4101   def_stmt = SSA_NAME_DEF_STMT (operand);
4102   def_phi = dyn_cast <gphi *> (def_stmt);
4103   if (!def_phi)
4104     return false;
4105
4106   FOR_EACH_PHI_ARG (arg_p, def_phi, i, SSA_OP_USE)
4107     if (lhs == USE_FROM_PTR (arg_p))
4108       return true;
4109   return false;
4110 }
4111
4112 /* Remove def stmt of VAR if VAR has zero uses and recurse
4113    on rhs1 operand if so.  */
4114
4115 static void
4116 remove_visited_stmt_chain (tree var)
4117 {
4118   gimple *stmt;
4119   gimple_stmt_iterator gsi;
4120
4121   while (1)
4122     {
4123       if (TREE_CODE (var) != SSA_NAME || !has_zero_uses (var))
4124         return;
4125       stmt = SSA_NAME_DEF_STMT (var);
4126       if (is_gimple_assign (stmt) && gimple_visited_p (stmt))
4127         {
4128           var = gimple_assign_rhs1 (stmt);
4129           gsi = gsi_for_stmt (stmt);
4130           reassoc_remove_stmt (&gsi);
4131           release_defs (stmt);
4132         }
4133       else
4134         return;
4135     }
4136 }
4137
4138 /* This function checks three consequtive operands in
4139    passed operands vector OPS starting from OPINDEX and
4140    swaps two operands if it is profitable for binary operation
4141    consuming OPINDEX + 1 abnd OPINDEX + 2 operands.
4142
4143    We pair ops with the same rank if possible.
4144
4145    The alternative we try is to see if STMT is a destructive
4146    update style statement, which is like:
4147    b = phi (a, ...)
4148    a = c + b;
4149    In that case, we want to use the destructive update form to
4150    expose the possible vectorizer sum reduction opportunity.
4151    In that case, the third operand will be the phi node. This
4152    check is not performed if STMT is null.
4153
4154    We could, of course, try to be better as noted above, and do a
4155    lot of work to try to find these opportunities in >3 operand
4156    cases, but it is unlikely to be worth it.  */
4157
4158 static void
4159 swap_ops_for_binary_stmt (vec<operand_entry *> ops,
4160                           unsigned int opindex, gimple *stmt)
4161 {
4162   operand_entry *oe1, *oe2, *oe3;
4163
4164   oe1 = ops[opindex];
4165   oe2 = ops[opindex + 1];
4166   oe3 = ops[opindex + 2];
4167
4168   if ((oe1->rank == oe2->rank
4169        && oe2->rank != oe3->rank)
4170       || (stmt && is_phi_for_stmt (stmt, oe3->op)
4171           && !is_phi_for_stmt (stmt, oe1->op)
4172           && !is_phi_for_stmt (stmt, oe2->op)))
4173     std::swap (*oe1, *oe3);
4174   else if ((oe1->rank == oe3->rank
4175             && oe2->rank != oe3->rank)
4176            || (stmt && is_phi_for_stmt (stmt, oe2->op)
4177                && !is_phi_for_stmt (stmt, oe1->op)
4178                && !is_phi_for_stmt (stmt, oe3->op)))
4179     std::swap (*oe1, *oe2);
4180 }
4181
4182 /* If definition of RHS1 or RHS2 dominates STMT, return the later of those
4183    two definitions, otherwise return STMT.  */
4184
4185 static inline gimple *
4186 find_insert_point (gimple *stmt, tree rhs1, tree rhs2)
4187 {
4188   if (TREE_CODE (rhs1) == SSA_NAME
4189       && reassoc_stmt_dominates_stmt_p (stmt, SSA_NAME_DEF_STMT (rhs1)))
4190     stmt = SSA_NAME_DEF_STMT (rhs1);
4191   if (TREE_CODE (rhs2) == SSA_NAME
4192       && reassoc_stmt_dominates_stmt_p (stmt, SSA_NAME_DEF_STMT (rhs2)))
4193     stmt = SSA_NAME_DEF_STMT (rhs2);
4194   return stmt;
4195 }
4196
4197 /* If the stmt that defines operand has to be inserted, insert it
4198    before the use.  */
4199 static void
4200 insert_stmt_before_use (gimple *stmt, gimple *stmt_to_insert)
4201 {
4202   gcc_assert (is_gimple_assign (stmt_to_insert));
4203   tree rhs1 = gimple_assign_rhs1 (stmt_to_insert);
4204   tree rhs2 = gimple_assign_rhs2 (stmt_to_insert);
4205   gimple *insert_point = find_insert_point (stmt, rhs1, rhs2);
4206   gimple_stmt_iterator gsi = gsi_for_stmt (insert_point);
4207   gimple_set_uid (stmt_to_insert, gimple_uid (insert_point));
4208
4209   /* If the insert point is not stmt, then insert_point would be
4210      the point where operand rhs1 or rhs2 is defined. In this case,
4211      stmt_to_insert has to be inserted afterwards. This would
4212      only happen when the stmt insertion point is flexible. */
4213   if (stmt == insert_point)
4214     gsi_insert_before (&gsi, stmt_to_insert, GSI_NEW_STMT);
4215   else
4216     insert_stmt_after (stmt_to_insert, insert_point);
4217 }
4218
4219
4220 /* Recursively rewrite our linearized statements so that the operators
4221    match those in OPS[OPINDEX], putting the computation in rank
4222    order.  Return new lhs.
4223    CHANGED is true if we shouldn't reuse the lhs SSA_NAME both in
4224    the current stmt and during recursive invocations.
4225    NEXT_CHANGED is true if we shouldn't reuse the lhs SSA_NAME in
4226    recursive invocations.  */
4227
4228 static tree
4229 rewrite_expr_tree (gimple *stmt, unsigned int opindex,
4230                    vec<operand_entry *> ops, bool changed, bool next_changed)
4231 {
4232   tree rhs1 = gimple_assign_rhs1 (stmt);
4233   tree rhs2 = gimple_assign_rhs2 (stmt);
4234   tree lhs = gimple_assign_lhs (stmt);
4235   operand_entry *oe;
4236
4237   /* The final recursion case for this function is that you have
4238      exactly two operations left.
4239      If we had exactly one op in the entire list to start with, we
4240      would have never called this function, and the tail recursion
4241      rewrites them one at a time.  */
4242   if (opindex + 2 == ops.length ())
4243     {
4244       operand_entry *oe1, *oe2;
4245
4246       oe1 = ops[opindex];
4247       oe2 = ops[opindex + 1];
4248
4249       if (rhs1 != oe1->op || rhs2 != oe2->op)
4250         {
4251           gimple_stmt_iterator gsi = gsi_for_stmt (stmt);
4252           unsigned int uid = gimple_uid (stmt);
4253
4254           if (dump_file && (dump_flags & TDF_DETAILS))
4255             {
4256               fprintf (dump_file, "Transforming ");
4257               print_gimple_stmt (dump_file, stmt, 0);
4258             }
4259
4260           /* If the stmt that defines operand has to be inserted, insert it
4261              before the use.  */
4262           if (oe1->stmt_to_insert)
4263             insert_stmt_before_use (stmt, oe1->stmt_to_insert);
4264           if (oe2->stmt_to_insert)
4265             insert_stmt_before_use (stmt, oe2->stmt_to_insert);
4266           /* Even when changed is false, reassociation could have e.g. removed
4267              some redundant operations, so unless we are just swapping the
4268              arguments or unless there is no change at all (then we just
4269              return lhs), force creation of a new SSA_NAME.  */
4270           if (changed || ((rhs1 != oe2->op || rhs2 != oe1->op) && opindex))
4271             {
4272               gimple *insert_point
4273                 = find_insert_point (stmt, oe1->op, oe2->op);
4274               lhs = make_ssa_name (TREE_TYPE (lhs));
4275               stmt
4276                 = gimple_build_assign (lhs, gimple_assign_rhs_code (stmt),
4277                                        oe1->op, oe2->op);
4278               gimple_set_uid (stmt, uid);
4279               gimple_set_visited (stmt, true);
4280               if (insert_point == gsi_stmt (gsi))
4281                 gsi_insert_before (&gsi, stmt, GSI_SAME_STMT);
4282               else
4283                 insert_stmt_after (stmt, insert_point);
4284             }
4285           else
4286             {
4287               gcc_checking_assert (find_insert_point (stmt, oe1->op, oe2->op)
4288                                    == stmt);
4289               gimple_assign_set_rhs1 (stmt, oe1->op);
4290               gimple_assign_set_rhs2 (stmt, oe2->op);
4291               update_stmt (stmt);
4292             }
4293
4294           if (rhs1 != oe1->op && rhs1 != oe2->op)
4295             remove_visited_stmt_chain (rhs1);
4296
4297           if (dump_file && (dump_flags & TDF_DETAILS))
4298             {
4299               fprintf (dump_file, " into ");
4300               print_gimple_stmt (dump_file, stmt, 0);
4301             }
4302         }
4303       return lhs;
4304     }
4305
4306   /* If we hit here, we should have 3 or more ops left.  */
4307   gcc_assert (opindex + 2 < ops.length ());
4308
4309   /* Rewrite the next operator.  */
4310   oe = ops[opindex];
4311
4312   /* If the stmt that defines operand has to be inserted, insert it
4313      before the use.  */
4314   if (oe->stmt_to_insert)
4315     insert_stmt_before_use (stmt, oe->stmt_to_insert);
4316
4317   /* Recurse on the LHS of the binary operator, which is guaranteed to
4318      be the non-leaf side.  */
4319   tree new_rhs1
4320     = rewrite_expr_tree (SSA_NAME_DEF_STMT (rhs1), opindex + 1, ops,
4321                          changed || oe->op != rhs2 || next_changed,
4322                          false);
4323
4324   if (oe->op != rhs2 || new_rhs1 != rhs1)
4325     {
4326       if (dump_file && (dump_flags & TDF_DETAILS))
4327         {
4328           fprintf (dump_file, "Transforming ");
4329           print_gimple_stmt (dump_file, stmt, 0);
4330         }
4331
4332       /* If changed is false, this is either opindex == 0
4333          or all outer rhs2's were equal to corresponding oe->op,
4334          and powi_result is NULL.
4335          That means lhs is equivalent before and after reassociation.
4336          Otherwise ensure the old lhs SSA_NAME is not reused and
4337          create a new stmt as well, so that any debug stmts will be
4338          properly adjusted.  */
4339       if (changed)
4340         {
4341           gimple_stmt_iterator gsi = gsi_for_stmt (stmt);
4342           unsigned int uid = gimple_uid (stmt);
4343           gimple *insert_point = find_insert_point (stmt, new_rhs1, oe->op);
4344
4345           lhs = make_ssa_name (TREE_TYPE (lhs));
4346           stmt = gimple_build_assign (lhs, gimple_assign_rhs_code (stmt),
4347                                       new_rhs1, oe->op);
4348           gimple_set_uid (stmt, uid);
4349           gimple_set_visited (stmt, true);
4350           if (insert_point == gsi_stmt (gsi))
4351             gsi_insert_before (&gsi, stmt, GSI_SAME_STMT);
4352           else
4353             insert_stmt_after (stmt, insert_point);
4354         }
4355       else
4356         {
4357           gcc_checking_assert (find_insert_point (stmt, new_rhs1, oe->op)
4358                                == stmt);
4359           gimple_assign_set_rhs1 (stmt, new_rhs1);
4360           gimple_assign_set_rhs2 (stmt, oe->op);
4361           update_stmt (stmt);
4362         }
4363
4364       if (dump_file && (dump_flags & TDF_DETAILS))
4365         {
4366           fprintf (dump_file, " into ");
4367           print_gimple_stmt (dump_file, stmt, 0);
4368         }
4369     }
4370   return lhs;
4371 }
4372
4373 /* Find out how many cycles we need to compute statements chain.
4374    OPS_NUM holds number os statements in a chain.  CPU_WIDTH is a
4375    maximum number of independent statements we may execute per cycle.  */
4376
4377 static int
4378 get_required_cycles (int ops_num, int cpu_width)
4379 {
4380   int res;
4381   int elog;
4382   unsigned int rest;
4383
4384   /* While we have more than 2 * cpu_width operands
4385      we may reduce number of operands by cpu_width
4386      per cycle.  */
4387   res = ops_num / (2 * cpu_width);
4388
4389   /* Remained operands count may be reduced twice per cycle
4390      until we have only one operand.  */
4391   rest = (unsigned)(ops_num - res * cpu_width);
4392   elog = exact_log2 (rest);
4393   if (elog >= 0)
4394     res += elog;
4395   else
4396     res += floor_log2 (rest) + 1;
4397
4398   return res;
4399 }
4400
4401 /* Returns an optimal number of registers to use for computation of
4402    given statements.  */
4403
4404 static int
4405 get_reassociation_width (int ops_num, enum tree_code opc,
4406                          machine_mode mode)
4407 {
4408   int param_width = PARAM_VALUE (PARAM_TREE_REASSOC_WIDTH);
4409   int width;
4410   int width_min;
4411   int cycles_best;
4412
4413   if (param_width > 0)
4414     width = param_width;
4415   else
4416     width = targetm.sched.reassociation_width (opc, mode);
4417
4418   if (width == 1)
4419     return width;
4420
4421   /* Get the minimal time required for sequence computation.  */
4422   cycles_best = get_required_cycles (ops_num, width);
4423
4424   /* Check if we may use less width and still compute sequence for
4425      the same time.  It will allow us to reduce registers usage.
4426      get_required_cycles is monotonically increasing with lower width
4427      so we can perform a binary search for the minimal width that still
4428      results in the optimal cycle count.  */
4429   width_min = 1;
4430   while (width > width_min)
4431     {
4432       int width_mid = (width + width_min) / 2;
4433
4434       if (get_required_cycles (ops_num, width_mid) == cycles_best)
4435         width = width_mid;
4436       else if (width_min < width_mid)
4437         width_min = width_mid;
4438       else
4439         break;
4440     }
4441
4442   return width;
4443 }
4444
4445 /* Recursively rewrite our linearized statements so that the operators
4446    match those in OPS[OPINDEX], putting the computation in rank
4447    order and trying to allow operations to be executed in
4448    parallel.  */
4449
4450 static void
4451 rewrite_expr_tree_parallel (gassign *stmt, int width,
4452                             vec<operand_entry *> ops)
4453 {
4454   enum tree_code opcode = gimple_assign_rhs_code (stmt);
4455   int op_num = ops.length ();
4456   gcc_assert (op_num > 0);
4457   int stmt_num = op_num - 1;
4458   gimple **stmts = XALLOCAVEC (gimple *, stmt_num);
4459   int op_index = op_num - 1;
4460   int stmt_index = 0;
4461   int ready_stmts_end = 0;
4462   int i = 0;
4463   gimple *stmt1 = NULL, *stmt2 = NULL;
4464   tree last_rhs1 = gimple_assign_rhs1 (stmt);
4465
4466   /* We start expression rewriting from the top statements.
4467      So, in this loop we create a full list of statements
4468      we will work with.  */
4469   stmts[stmt_num - 1] = stmt;
4470   for (i = stmt_num - 2; i >= 0; i--)
4471     stmts[i] = SSA_NAME_DEF_STMT (gimple_assign_rhs1 (stmts[i+1]));
4472
4473   for (i = 0; i < stmt_num; i++)
4474     {
4475       tree op1, op2;
4476
4477       /* Determine whether we should use results of
4478          already handled statements or not.  */
4479       if (ready_stmts_end == 0
4480           && (i - stmt_index >= width || op_index < 1))
4481         ready_stmts_end = i;
4482
4483       /* Now we choose operands for the next statement.  Non zero
4484          value in ready_stmts_end means here that we should use
4485          the result of already generated statements as new operand.  */
4486       if (ready_stmts_end > 0)
4487         {
4488           op1 = gimple_assign_lhs (stmts[stmt_index++]);
4489           if (ready_stmts_end > stmt_index)
4490             op2 = gimple_assign_lhs (stmts[stmt_index++]);
4491           else if (op_index >= 0)
4492             {
4493               operand_entry *oe = ops[op_index--];
4494               stmt2 = oe->stmt_to_insert;
4495               op2 = oe->op;
4496             }
4497           else
4498             {
4499               gcc_assert (stmt_index < i);
4500               op2 = gimple_assign_lhs (stmts[stmt_index++]);
4501             }
4502
4503           if (stmt_index >= ready_stmts_end)
4504             ready_stmts_end = 0;
4505         }
4506       else
4507         {
4508           if (op_index > 1)
4509             swap_ops_for_binary_stmt (ops, op_index - 2, NULL);
4510           operand_entry *oe2 = ops[op_index--];
4511           operand_entry *oe1 = ops[op_index--];
4512           op2 = oe2->op;
4513           stmt2 = oe2->stmt_to_insert;
4514           op1 = oe1->op;
4515           stmt1 = oe1->stmt_to_insert;
4516         }
4517
4518       /* If we emit the last statement then we should put
4519          operands into the last statement.  It will also
4520          break the loop.  */
4521       if (op_index < 0 && stmt_index == i)
4522         i = stmt_num - 1;
4523
4524       if (dump_file && (dump_flags & TDF_DETAILS))
4525         {
4526           fprintf (dump_file, "Transforming ");
4527           print_gimple_stmt (dump_file, stmts[i], 0);
4528         }
4529
4530       /* If the stmt that defines operand has to be inserted, insert it
4531          before the use.  */
4532       if (stmt1)
4533         insert_stmt_before_use (stmts[i], stmt1);
4534       if (stmt2)
4535         insert_stmt_before_use (stmts[i], stmt2);
4536       stmt1 = stmt2 = NULL;
4537
4538       /* We keep original statement only for the last one.  All
4539          others are recreated.  */
4540       if (i == stmt_num - 1)
4541         {
4542           gimple_assign_set_rhs1 (stmts[i], op1);
4543           gimple_assign_set_rhs2 (stmts[i], op2);
4544           update_stmt (stmts[i]);
4545         }
4546       else
4547         {
4548           stmts[i] = build_and_add_sum (TREE_TYPE (last_rhs1), op1, op2, opcode);
4549         }
4550       if (dump_file && (dump_flags & TDF_DETAILS))
4551         {
4552           fprintf (dump_file, " into ");
4553           print_gimple_stmt (dump_file, stmts[i], 0);
4554         }
4555     }
4556
4557   remove_visited_stmt_chain (last_rhs1);
4558 }
4559
4560 /* Transform STMT, which is really (A +B) + (C + D) into the left
4561    linear form, ((A+B)+C)+D.
4562    Recurse on D if necessary.  */
4563
4564 static void
4565 linearize_expr (gimple *stmt)
4566 {
4567   gimple_stmt_iterator gsi;
4568   gimple *binlhs = SSA_NAME_DEF_STMT (gimple_assign_rhs1 (stmt));
4569   gimple *binrhs = SSA_NAME_DEF_STMT (gimple_assign_rhs2 (stmt));
4570   gimple *oldbinrhs = binrhs;
4571   enum tree_code rhscode = gimple_assign_rhs_code (stmt);
4572   gimple *newbinrhs = NULL;
4573   struct loop *loop = loop_containing_stmt (stmt);
4574   tree lhs = gimple_assign_lhs (stmt);
4575
4576   gcc_assert (is_reassociable_op (binlhs, rhscode, loop)
4577               && is_reassociable_op (binrhs, rhscode, loop));
4578
4579   gsi = gsi_for_stmt (stmt);
4580
4581   gimple_assign_set_rhs2 (stmt, gimple_assign_rhs1 (binrhs));
4582   binrhs = gimple_build_assign (make_ssa_name (TREE_TYPE (lhs)),
4583                                 gimple_assign_rhs_code (binrhs),
4584                                 gimple_assign_lhs (binlhs),
4585                                 gimple_assign_rhs2 (binrhs));
4586   gimple_assign_set_rhs1 (stmt, gimple_assign_lhs (binrhs));
4587   gsi_insert_before (&gsi, binrhs, GSI_SAME_STMT);
4588   gimple_set_uid (binrhs, gimple_uid (stmt));
4589
4590   if (TREE_CODE (gimple_assign_rhs2 (stmt)) == SSA_NAME)
4591     newbinrhs = SSA_NAME_DEF_STMT (gimple_assign_rhs2 (stmt));
4592
4593   if (dump_file && (dump_flags & TDF_DETAILS))
4594     {
4595       fprintf (dump_file, "Linearized: ");
4596       print_gimple_stmt (dump_file, stmt, 0);
4597     }
4598
4599   reassociate_stats.linearized++;
4600   update_stmt (stmt);
4601
4602   gsi = gsi_for_stmt (oldbinrhs);
4603   reassoc_remove_stmt (&gsi);
4604   release_defs (oldbinrhs);
4605
4606   gimple_set_visited (stmt, true);
4607   gimple_set_visited (binlhs, true);
4608   gimple_set_visited (binrhs, true);
4609
4610   /* Tail recurse on the new rhs if it still needs reassociation.  */
4611   if (newbinrhs && is_reassociable_op (newbinrhs, rhscode, loop))
4612     /* ??? This should probably be linearize_expr (newbinrhs) but I don't
4613            want to change the algorithm while converting to tuples.  */
4614     linearize_expr (stmt);
4615 }
4616
4617 /* If LHS has a single immediate use that is a GIMPLE_ASSIGN statement, return
4618    it.  Otherwise, return NULL.  */
4619
4620 static gimple *
4621 get_single_immediate_use (tree lhs)
4622 {
4623   use_operand_p immuse;
4624   gimple *immusestmt;
4625
4626   if (TREE_CODE (lhs) == SSA_NAME
4627       && single_imm_use (lhs, &immuse, &immusestmt)
4628       && is_gimple_assign (immusestmt))
4629     return immusestmt;
4630
4631   return NULL;
4632 }
4633
4634 /* Recursively negate the value of TONEGATE, and return the SSA_NAME
4635    representing the negated value.  Insertions of any necessary
4636    instructions go before GSI.
4637    This function is recursive in that, if you hand it "a_5" as the
4638    value to negate, and a_5 is defined by "a_5 = b_3 + b_4", it will
4639    transform b_3 + b_4 into a_5 = -b_3 + -b_4.  */
4640
4641 static tree
4642 negate_value (tree tonegate, gimple_stmt_iterator *gsip)
4643 {
4644   gimple *negatedefstmt = NULL;
4645   tree resultofnegate;
4646   gimple_stmt_iterator gsi;
4647   unsigned int uid;
4648
4649   /* If we are trying to negate a name, defined by an add, negate the
4650      add operands instead.  */
4651   if (TREE_CODE (tonegate) == SSA_NAME)
4652     negatedefstmt = SSA_NAME_DEF_STMT (tonegate);
4653   if (TREE_CODE (tonegate) == SSA_NAME
4654       && is_gimple_assign (negatedefstmt)
4655       && TREE_CODE (gimple_assign_lhs (negatedefstmt)) == SSA_NAME
4656       && has_single_use (gimple_assign_lhs (negatedefstmt))
4657       && gimple_assign_rhs_code (negatedefstmt) == PLUS_EXPR)
4658     {
4659       tree rhs1 = gimple_assign_rhs1 (negatedefstmt);
4660       tree rhs2 = gimple_assign_rhs2 (negatedefstmt);
4661       tree lhs = gimple_assign_lhs (negatedefstmt);
4662       gimple *g;
4663
4664       gsi = gsi_for_stmt (negatedefstmt);
4665       rhs1 = negate_value (rhs1, &gsi);
4666
4667       gsi = gsi_for_stmt (negatedefstmt);
4668       rhs2 = negate_value (rhs2, &gsi);
4669
4670       gsi = gsi_for_stmt (negatedefstmt);
4671       lhs = make_ssa_name (TREE_TYPE (lhs));
4672       gimple_set_visited (negatedefstmt, true);
4673       g = gimple_build_assign (lhs, PLUS_EXPR, rhs1, rhs2);
4674       gimple_set_uid (g, gimple_uid (negatedefstmt));
4675       gsi_insert_before (&gsi, g, GSI_SAME_STMT);
4676       return lhs;
4677     }
4678
4679   tonegate = fold_build1 (NEGATE_EXPR, TREE_TYPE (tonegate), tonegate);
4680   resultofnegate = force_gimple_operand_gsi (gsip, tonegate, true,
4681                                              NULL_TREE, true, GSI_SAME_STMT);
4682   gsi = *gsip;
4683   uid = gimple_uid (gsi_stmt (gsi));
4684   for (gsi_prev (&gsi); !gsi_end_p (gsi); gsi_prev (&gsi))
4685     {
4686       gimple *stmt = gsi_stmt (gsi);
4687       if (gimple_uid (stmt) != 0)
4688         break;
4689       gimple_set_uid (stmt, uid);
4690     }
4691   return resultofnegate;
4692 }
4693
4694 /* Return true if we should break up the subtract in STMT into an add
4695    with negate.  This is true when we the subtract operands are really
4696    adds, or the subtract itself is used in an add expression.  In
4697    either case, breaking up the subtract into an add with negate
4698    exposes the adds to reassociation.  */
4699
4700 static bool
4701 should_break_up_subtract (gimple *stmt)
4702 {
4703   tree lhs = gimple_assign_lhs (stmt);
4704   tree binlhs = gimple_assign_rhs1 (stmt);
4705   tree binrhs = gimple_assign_rhs2 (stmt);
4706   gimple *immusestmt;
4707   struct loop *loop = loop_containing_stmt (stmt);
4708
4709   if (TREE_CODE (binlhs) == SSA_NAME
4710       && is_reassociable_op (SSA_NAME_DEF_STMT (binlhs), PLUS_EXPR, loop))
4711     return true;
4712
4713   if (TREE_CODE (binrhs) == SSA_NAME
4714       && is_reassociable_op (SSA_NAME_DEF_STMT (binrhs), PLUS_EXPR, loop))
4715     return true;
4716
4717   if (TREE_CODE (lhs) == SSA_NAME
4718       && (immusestmt = get_single_immediate_use (lhs))
4719       && is_gimple_assign (immusestmt)
4720       && (gimple_assign_rhs_code (immusestmt) == PLUS_EXPR
4721           ||  gimple_assign_rhs_code (immusestmt) == MULT_EXPR))
4722     return true;
4723   return false;
4724 }
4725
4726 /* Transform STMT from A - B into A + -B.  */
4727
4728 static void
4729 break_up_subtract (gimple *stmt, gimple_stmt_iterator *gsip)
4730 {
4731   tree rhs1 = gimple_assign_rhs1 (stmt);
4732   tree rhs2 = gimple_assign_rhs2 (stmt);
4733
4734   if (dump_file && (dump_flags & TDF_DETAILS))
4735     {
4736       fprintf (dump_file, "Breaking up subtract ");
4737       print_gimple_stmt (dump_file, stmt, 0);
4738     }
4739
4740   rhs2 = negate_value (rhs2, gsip);
4741   gimple_assign_set_rhs_with_ops (gsip, PLUS_EXPR, rhs1, rhs2);
4742   update_stmt (stmt);
4743 }
4744
4745 /* Determine whether STMT is a builtin call that raises an SSA name
4746    to an integer power and has only one use.  If so, and this is early
4747    reassociation and unsafe math optimizations are permitted, place
4748    the SSA name in *BASE and the exponent in *EXPONENT, and return TRUE.
4749    If any of these conditions does not hold, return FALSE.  */
4750
4751 static bool
4752 acceptable_pow_call (gcall *stmt, tree *base, HOST_WIDE_INT *exponent)
4753 {
4754   tree arg1;
4755   REAL_VALUE_TYPE c, cint;
4756
4757   switch (gimple_call_combined_fn (stmt))
4758     {
4759     CASE_CFN_POW:
4760       if (flag_errno_math)
4761         return false;
4762
4763       *base = gimple_call_arg (stmt, 0);
4764       arg1 = gimple_call_arg (stmt, 1);
4765
4766       if (TREE_CODE (arg1) != REAL_CST)
4767         return false;
4768
4769       c = TREE_REAL_CST (arg1);
4770
4771       if (REAL_EXP (&c) > HOST_BITS_PER_WIDE_INT)
4772         return false;
4773
4774       *exponent = real_to_integer (&c);
4775       real_from_integer (&cint, VOIDmode, *exponent, SIGNED);
4776       if (!real_identical (&c, &cint))
4777         return false;
4778
4779       break;
4780
4781     CASE_CFN_POWI:
4782       *base = gimple_call_arg (stmt, 0);
4783       arg1 = gimple_call_arg (stmt, 1);
4784
4785       if (!tree_fits_shwi_p (arg1))
4786         return false;
4787
4788       *exponent = tree_to_shwi (arg1);
4789       break;
4790
4791     default:
4792       return false;
4793     }
4794
4795   /* Expanding negative exponents is generally unproductive, so we don't
4796      complicate matters with those.  Exponents of zero and one should
4797      have been handled by expression folding.  */
4798   if (*exponent < 2 || TREE_CODE (*base) != SSA_NAME)
4799     return false;
4800
4801   return true;
4802 }
4803
4804 /* Try to derive and add operand entry for OP to *OPS.  Return false if
4805    unsuccessful.  */
4806
4807 static bool
4808 try_special_add_to_ops (vec<operand_entry *> *ops,
4809                         enum tree_code code,
4810                         tree op, gimple* def_stmt)
4811 {
4812   tree base = NULL_TREE;
4813   HOST_WIDE_INT exponent = 0;
4814
4815   if (TREE_CODE (op) != SSA_NAME
4816       || ! has_single_use (op))
4817     return false;
4818
4819   if (code == MULT_EXPR
4820       && reassoc_insert_powi_p
4821       && flag_unsafe_math_optimizations
4822       && is_gimple_call (def_stmt)
4823       && acceptable_pow_call (as_a <gcall *> (def_stmt), &base, &exponent))
4824     {
4825       add_repeat_to_ops_vec (ops, base, exponent);
4826       gimple_set_visited (def_stmt, true);
4827       return true;
4828     }
4829   else if (code == MULT_EXPR
4830            && is_gimple_assign (def_stmt)
4831            && gimple_assign_rhs_code (def_stmt) == NEGATE_EXPR
4832            && !HONOR_SNANS (TREE_TYPE (op))
4833            && (!HONOR_SIGNED_ZEROS (TREE_TYPE (op))
4834                || !COMPLEX_FLOAT_TYPE_P (TREE_TYPE (op))))
4835     {
4836       tree rhs1 = gimple_assign_rhs1 (def_stmt);
4837       tree cst = build_minus_one_cst (TREE_TYPE (op));
4838       add_to_ops_vec (ops, rhs1);
4839       add_to_ops_vec (ops, cst);
4840       gimple_set_visited (def_stmt, true);
4841       return true;
4842     }
4843
4844   return false;
4845 }
4846
4847 /* Recursively linearize a binary expression that is the RHS of STMT.
4848    Place the operands of the expression tree in the vector named OPS.  */
4849
4850 static void
4851 linearize_expr_tree (vec<operand_entry *> *ops, gimple *stmt,
4852                      bool is_associative, bool set_visited)
4853 {
4854   tree binlhs = gimple_assign_rhs1 (stmt);
4855   tree binrhs = gimple_assign_rhs2 (stmt);
4856   gimple *binlhsdef = NULL, *binrhsdef = NULL;
4857   bool binlhsisreassoc = false;
4858   bool binrhsisreassoc = false;
4859   enum tree_code rhscode = gimple_assign_rhs_code (stmt);
4860   struct loop *loop = loop_containing_stmt (stmt);
4861
4862   if (set_visited)
4863     gimple_set_visited (stmt, true);
4864
4865   if (TREE_CODE (binlhs) == SSA_NAME)
4866     {
4867       binlhsdef = SSA_NAME_DEF_STMT (binlhs);
4868       binlhsisreassoc = (is_reassociable_op (binlhsdef, rhscode, loop)
4869                          && !stmt_could_throw_p (binlhsdef));
4870     }
4871
4872   if (TREE_CODE (binrhs) == SSA_NAME)
4873     {
4874       binrhsdef = SSA_NAME_DEF_STMT (binrhs);
4875       binrhsisreassoc = (is_reassociable_op (binrhsdef, rhscode, loop)
4876                          && !stmt_could_throw_p (binrhsdef));
4877     }
4878
4879   /* If the LHS is not reassociable, but the RHS is, we need to swap
4880      them.  If neither is reassociable, there is nothing we can do, so
4881      just put them in the ops vector.  If the LHS is reassociable,
4882      linearize it.  If both are reassociable, then linearize the RHS
4883      and the LHS.  */
4884
4885   if (!binlhsisreassoc)
4886     {
4887       /* If this is not a associative operation like division, give up.  */
4888       if (!is_associative)
4889         {
4890           add_to_ops_vec (ops, binrhs);
4891           return;
4892         }
4893
4894       if (!binrhsisreassoc)
4895         {
4896           if (!try_special_add_to_ops (ops, rhscode, binrhs, binrhsdef))
4897             add_to_ops_vec (ops, binrhs);
4898
4899           if (!try_special_add_to_ops (ops, rhscode, binlhs, binlhsdef))
4900             add_to_ops_vec (ops, binlhs);
4901
4902           return;
4903         }
4904
4905       if (dump_file && (dump_flags & TDF_DETAILS))
4906         {
4907           fprintf (dump_file, "swapping operands of ");
4908           print_gimple_stmt (dump_file, stmt, 0);
4909         }
4910
4911       swap_ssa_operands (stmt,
4912                          gimple_assign_rhs1_ptr (stmt),
4913                          gimple_assign_rhs2_ptr (stmt));
4914       update_stmt (stmt);
4915
4916       if (dump_file && (dump_flags & TDF_DETAILS))
4917         {
4918           fprintf (dump_file, " is now ");
4919           print_gimple_stmt (dump_file, stmt, 0);
4920         }
4921
4922       /* We want to make it so the lhs is always the reassociative op,
4923          so swap.  */
4924       std::swap (binlhs, binrhs);
4925     }
4926   else if (binrhsisreassoc)
4927     {
4928       linearize_expr (stmt);
4929       binlhs = gimple_assign_rhs1 (stmt);
4930       binrhs = gimple_assign_rhs2 (stmt);
4931     }
4932
4933   gcc_assert (TREE_CODE (binrhs) != SSA_NAME
4934               || !is_reassociable_op (SSA_NAME_DEF_STMT (binrhs),
4935                                       rhscode, loop));
4936   linearize_expr_tree (ops, SSA_NAME_DEF_STMT (binlhs),
4937                        is_associative, set_visited);
4938
4939   if (!try_special_add_to_ops (ops, rhscode, binrhs, binrhsdef))
4940     add_to_ops_vec (ops, binrhs);
4941 }
4942
4943 /* Repropagate the negates back into subtracts, since no other pass
4944    currently does it.  */
4945
4946 static void
4947 repropagate_negates (void)
4948 {
4949   unsigned int i = 0;
4950   tree negate;
4951
4952   FOR_EACH_VEC_ELT (plus_negates, i, negate)
4953     {
4954       gimple *user = get_single_immediate_use (negate);
4955
4956       if (!user || !is_gimple_assign (user))
4957         continue;
4958
4959       /* The negate operand can be either operand of a PLUS_EXPR
4960          (it can be the LHS if the RHS is a constant for example).
4961
4962          Force the negate operand to the RHS of the PLUS_EXPR, then
4963          transform the PLUS_EXPR into a MINUS_EXPR.  */
4964       if (gimple_assign_rhs_code (user) == PLUS_EXPR)
4965         {
4966           /* If the negated operand appears on the LHS of the
4967              PLUS_EXPR, exchange the operands of the PLUS_EXPR
4968              to force the negated operand to the RHS of the PLUS_EXPR.  */
4969           if (gimple_assign_rhs1 (user) == negate)
4970             {
4971               swap_ssa_operands (user,
4972                                  gimple_assign_rhs1_ptr (user),
4973                                  gimple_assign_rhs2_ptr (user));
4974             }
4975
4976           /* Now transform the PLUS_EXPR into a MINUS_EXPR and replace
4977              the RHS of the PLUS_EXPR with the operand of the NEGATE_EXPR.  */
4978           if (gimple_assign_rhs2 (user) == negate)
4979             {
4980               tree rhs1 = gimple_assign_rhs1 (user);
4981               tree rhs2 = gimple_assign_rhs1 (SSA_NAME_DEF_STMT (negate));
4982               gimple_stmt_iterator gsi = gsi_for_stmt (user);
4983               gimple_assign_set_rhs_with_ops (&gsi, MINUS_EXPR, rhs1, rhs2);
4984               update_stmt (user);
4985             }
4986         }
4987       else if (gimple_assign_rhs_code (user) == MINUS_EXPR)
4988         {
4989           if (gimple_assign_rhs1 (user) == negate)
4990             {
4991               /* We have
4992                    x = -a
4993                    y = x - b
4994                  which we transform into
4995                    x = a + b
4996                    y = -x .
4997                  This pushes down the negate which we possibly can merge
4998                  into some other operation, hence insert it into the
4999                  plus_negates vector.  */
5000               gimple *feed = SSA_NAME_DEF_STMT (negate);
5001               tree a = gimple_assign_rhs1 (feed);
5002               tree b = gimple_assign_rhs2 (user);
5003               gimple_stmt_iterator gsi = gsi_for_stmt (feed);
5004               gimple_stmt_iterator gsi2 = gsi_for_stmt (user);
5005               tree x = make_ssa_name (TREE_TYPE (gimple_assign_lhs (feed)));
5006               gimple *g = gimple_build_assign (x, PLUS_EXPR, a, b);
5007               gsi_insert_before (&gsi2, g, GSI_SAME_STMT);
5008               gimple_assign_set_rhs_with_ops (&gsi2, NEGATE_EXPR, x);
5009               user = gsi_stmt (gsi2);
5010               update_stmt (user);
5011               reassoc_remove_stmt (&gsi);
5012               release_defs (feed);
5013               plus_negates.safe_push (gimple_assign_lhs (user));
5014             }
5015           else
5016             {
5017               /* Transform "x = -a; y = b - x" into "y = b + a", getting
5018                  rid of one operation.  */
5019               gimple *feed = SSA_NAME_DEF_STMT (negate);
5020               tree a = gimple_assign_rhs1 (feed);
5021               tree rhs1 = gimple_assign_rhs1 (user);
5022               gimple_stmt_iterator gsi = gsi_for_stmt (user);
5023               gimple_assign_set_rhs_with_ops (&gsi, PLUS_EXPR, rhs1, a);
5024               update_stmt (gsi_stmt (gsi));
5025             }
5026         }
5027     }
5028 }
5029
5030 /* Returns true if OP is of a type for which we can do reassociation.
5031    That is for integral or non-saturating fixed-point types, and for
5032    floating point type when associative-math is enabled.  */
5033
5034 static bool
5035 can_reassociate_p (tree op)
5036 {
5037   tree type = TREE_TYPE (op);
5038   if (TREE_CODE (op) == SSA_NAME && SSA_NAME_OCCURS_IN_ABNORMAL_PHI (op))
5039     return false;
5040   if ((ANY_INTEGRAL_TYPE_P (type) && TYPE_OVERFLOW_WRAPS (type))
5041       || NON_SAT_FIXED_POINT_TYPE_P (type)
5042       || (flag_associative_math && FLOAT_TYPE_P (type)))
5043     return true;
5044   return false;
5045 }
5046
5047 /* Break up subtract operations in block BB.
5048
5049    We do this top down because we don't know whether the subtract is
5050    part of a possible chain of reassociation except at the top.
5051
5052    IE given
5053    d = f + g
5054    c = a + e
5055    b = c - d
5056    q = b - r
5057    k = t - q
5058
5059    we want to break up k = t - q, but we won't until we've transformed q
5060    = b - r, which won't be broken up until we transform b = c - d.
5061
5062    En passant, clear the GIMPLE visited flag on every statement
5063    and set UIDs within each basic block.  */
5064
5065 static void
5066 break_up_subtract_bb (basic_block bb)
5067 {
5068   gimple_stmt_iterator gsi;
5069   basic_block son;
5070   unsigned int uid = 1;
5071
5072   for (gsi = gsi_start_bb (bb); !gsi_end_p (gsi); gsi_next (&gsi))
5073     {
5074       gimple *stmt = gsi_stmt (gsi);
5075       gimple_set_visited (stmt, false);
5076       gimple_set_uid (stmt, uid++);
5077
5078       if (!is_gimple_assign (stmt)
5079           || !can_reassociate_p (gimple_assign_lhs (stmt)))
5080         continue;
5081
5082       /* Look for simple gimple subtract operations.  */
5083       if (gimple_assign_rhs_code (stmt) == MINUS_EXPR)
5084         {
5085           if (!can_reassociate_p (gimple_assign_rhs1 (stmt))
5086               || !can_reassociate_p (gimple_assign_rhs2 (stmt)))
5087             continue;
5088
5089           /* Check for a subtract used only in an addition.  If this
5090              is the case, transform it into add of a negate for better
5091              reassociation.  IE transform C = A-B into C = A + -B if C
5092              is only used in an addition.  */
5093           if (should_break_up_subtract (stmt))
5094             break_up_subtract (stmt, &gsi);
5095         }
5096       else if (gimple_assign_rhs_code (stmt) == NEGATE_EXPR
5097                && can_reassociate_p (gimple_assign_rhs1 (stmt)))
5098         plus_negates.safe_push (gimple_assign_lhs (stmt));
5099     }
5100   for (son = first_dom_son (CDI_DOMINATORS, bb);
5101        son;
5102        son = next_dom_son (CDI_DOMINATORS, son))
5103     break_up_subtract_bb (son);
5104 }
5105
5106 /* Used for repeated factor analysis.  */
5107 struct repeat_factor
5108 {
5109   /* An SSA name that occurs in a multiply chain.  */
5110   tree factor;
5111
5112   /* Cached rank of the factor.  */
5113   unsigned rank;
5114
5115   /* Number of occurrences of the factor in the chain.  */
5116   HOST_WIDE_INT count;
5117
5118   /* An SSA name representing the product of this factor and
5119      all factors appearing later in the repeated factor vector.  */
5120   tree repr;
5121 };
5122
5123
5124 static vec<repeat_factor> repeat_factor_vec;
5125
5126 /* Used for sorting the repeat factor vector.  Sort primarily by
5127    ascending occurrence count, secondarily by descending rank.  */
5128
5129 static int
5130 compare_repeat_factors (const void *x1, const void *x2)
5131 {
5132   const repeat_factor *rf1 = (const repeat_factor *) x1;
5133   const repeat_factor *rf2 = (const repeat_factor *) x2;
5134
5135   if (rf1->count != rf2->count)
5136     return rf1->count - rf2->count;
5137
5138   return rf2->rank - rf1->rank;
5139 }
5140
5141 /* Look for repeated operands in OPS in the multiply tree rooted at
5142    STMT.  Replace them with an optimal sequence of multiplies and powi
5143    builtin calls, and remove the used operands from OPS.  Return an
5144    SSA name representing the value of the replacement sequence.  */
5145
5146 static tree
5147 attempt_builtin_powi (gimple *stmt, vec<operand_entry *> *ops)
5148 {
5149   unsigned i, j, vec_len;
5150   int ii;
5151   operand_entry *oe;
5152   repeat_factor *rf1, *rf2;
5153   repeat_factor rfnew;
5154   tree result = NULL_TREE;
5155   tree target_ssa, iter_result;
5156   tree type = TREE_TYPE (gimple_get_lhs (stmt));
5157   tree powi_fndecl = mathfn_built_in (type, BUILT_IN_POWI);
5158   gimple_stmt_iterator gsi = gsi_for_stmt (stmt);
5159   gimple *mul_stmt, *pow_stmt;
5160
5161   /* Nothing to do if BUILT_IN_POWI doesn't exist for this type and
5162      target.  */
5163   if (!powi_fndecl)
5164     return NULL_TREE;
5165
5166   /* Allocate the repeated factor vector.  */
5167   repeat_factor_vec.create (10);
5168
5169   /* Scan the OPS vector for all SSA names in the product and build
5170      up a vector of occurrence counts for each factor.  */
5171   FOR_EACH_VEC_ELT (*ops, i, oe)
5172     {
5173       if (TREE_CODE (oe->op) == SSA_NAME)
5174         {
5175           FOR_EACH_VEC_ELT (repeat_factor_vec, j, rf1)
5176             {
5177               if (rf1->factor == oe->op)
5178                 {
5179                   rf1->count += oe->count;
5180                   break;
5181                 }
5182             }
5183
5184           if (j >= repeat_factor_vec.length ())
5185             {
5186               rfnew.factor = oe->op;
5187               rfnew.rank = oe->rank;
5188               rfnew.count = oe->count;
5189               rfnew.repr = NULL_TREE;
5190               repeat_factor_vec.safe_push (rfnew);
5191             }
5192         }
5193     }
5194
5195   /* Sort the repeated factor vector by (a) increasing occurrence count,
5196      and (b) decreasing rank.  */
5197   repeat_factor_vec.qsort (compare_repeat_factors);
5198
5199   /* It is generally best to combine as many base factors as possible
5200      into a product before applying __builtin_powi to the result.
5201      However, the sort order chosen for the repeated factor vector
5202      allows us to cache partial results for the product of the base
5203      factors for subsequent use.  When we already have a cached partial
5204      result from a previous iteration, it is best to make use of it
5205      before looking for another __builtin_pow opportunity.
5206
5207      As an example, consider x * x * y * y * y * z * z * z * z.
5208      We want to first compose the product x * y * z, raise it to the
5209      second power, then multiply this by y * z, and finally multiply
5210      by z.  This can be done in 5 multiplies provided we cache y * z
5211      for use in both expressions:
5212
5213         t1 = y * z
5214         t2 = t1 * x
5215         t3 = t2 * t2
5216         t4 = t1 * t3
5217         result = t4 * z
5218
5219      If we instead ignored the cached y * z and first multiplied by
5220      the __builtin_pow opportunity z * z, we would get the inferior:
5221
5222         t1 = y * z
5223         t2 = t1 * x
5224         t3 = t2 * t2
5225         t4 = z * z
5226         t5 = t3 * t4
5227         result = t5 * y  */
5228
5229   vec_len = repeat_factor_vec.length ();
5230
5231   /* Repeatedly look for opportunities to create a builtin_powi call.  */
5232   while (true)
5233     {
5234       HOST_WIDE_INT power;
5235
5236       /* First look for the largest cached product of factors from
5237          preceding iterations.  If found, create a builtin_powi for
5238          it if the minimum occurrence count for its factors is at
5239          least 2, or just use this cached product as our next
5240          multiplicand if the minimum occurrence count is 1.  */
5241       FOR_EACH_VEC_ELT (repeat_factor_vec, j, rf1)
5242         {
5243           if (rf1->repr && rf1->count > 0)
5244             break;
5245         }
5246
5247       if (j < vec_len)
5248         {
5249           power = rf1->count;
5250
5251           if (power == 1)
5252             {
5253               iter_result = rf1->repr;
5254
5255               if (dump_file && (dump_flags & TDF_DETAILS))
5256                 {
5257                   unsigned elt;
5258                   repeat_factor *rf;
5259                   fputs ("Multiplying by cached product ", dump_file);
5260                   for (elt = j; elt < vec_len; elt++)
5261                     {
5262                       rf = &repeat_factor_vec[elt];
5263                       print_generic_expr (dump_file, rf->factor);
5264                       if (elt < vec_len - 1)
5265                         fputs (" * ", dump_file);
5266                     }
5267                   fputs ("\n", dump_file);
5268                 }
5269             }
5270           else
5271             {
5272               iter_result = make_temp_ssa_name (type, NULL, "reassocpow");
5273               pow_stmt = gimple_build_call (powi_fndecl, 2, rf1->repr,
5274                                             build_int_cst (integer_type_node,
5275                                                            power));
5276               gimple_call_set_lhs (pow_stmt, iter_result);
5277               gimple_set_location (pow_stmt, gimple_location (stmt));
5278               gimple_set_uid (pow_stmt, gimple_uid (stmt));
5279               gsi_insert_before (&gsi, pow_stmt, GSI_SAME_STMT);
5280
5281               if (dump_file && (dump_flags & TDF_DETAILS))
5282                 {
5283                   unsigned elt;
5284                   repeat_factor *rf;
5285                   fputs ("Building __builtin_pow call for cached product (",
5286                          dump_file);
5287                   for (elt = j; elt < vec_len; elt++)
5288                     {
5289                       rf = &repeat_factor_vec[elt];
5290                       print_generic_expr (dump_file, rf->factor);
5291                       if (elt < vec_len - 1)
5292                         fputs (" * ", dump_file);
5293                     }
5294                   fprintf (dump_file, ")^" HOST_WIDE_INT_PRINT_DEC"\n",
5295                            power);
5296                 }
5297             }
5298         }
5299       else
5300         {
5301           /* Otherwise, find the first factor in the repeated factor
5302              vector whose occurrence count is at least 2.  If no such
5303              factor exists, there are no builtin_powi opportunities
5304              remaining.  */
5305           FOR_EACH_VEC_ELT (repeat_factor_vec, j, rf1)
5306             {
5307               if (rf1->count >= 2)
5308                 break;
5309             }
5310
5311           if (j >= vec_len)
5312             break;
5313
5314           power = rf1->count;
5315
5316           if (dump_file && (dump_flags & TDF_DETAILS))
5317             {
5318               unsigned elt;
5319               repeat_factor *rf;
5320               fputs ("Building __builtin_pow call for (", dump_file);
5321               for (elt = j; elt < vec_len; elt++)
5322                 {
5323                   rf = &repeat_factor_vec[elt];
5324                   print_generic_expr (dump_file, rf->factor);
5325                   if (elt < vec_len - 1)
5326                     fputs (" * ", dump_file);
5327                 }
5328               fprintf (dump_file, ")^" HOST_WIDE_INT_PRINT_DEC"\n", power);
5329             }
5330
5331           reassociate_stats.pows_created++;
5332
5333           /* Visit each element of the vector in reverse order (so that
5334              high-occurrence elements are visited first, and within the
5335              same occurrence count, lower-ranked elements are visited
5336              first).  Form a linear product of all elements in this order
5337              whose occurrencce count is at least that of element J.
5338              Record the SSA name representing the product of each element
5339              with all subsequent elements in the vector.  */
5340           if (j == vec_len - 1)
5341             rf1->repr = rf1->factor;
5342           else
5343             {
5344               for (ii = vec_len - 2; ii >= (int)j; ii--)
5345                 {
5346                   tree op1, op2;
5347
5348                   rf1 = &repeat_factor_vec[ii];
5349                   rf2 = &repeat_factor_vec[ii + 1];
5350
5351                   /* Init the last factor's representative to be itself.  */
5352                   if (!rf2->repr)
5353                     rf2->repr = rf2->factor;
5354
5355                   op1 = rf1->factor;
5356                   op2 = rf2->repr;
5357
5358                   target_ssa = make_temp_ssa_name (type, NULL, "reassocpow");
5359                   mul_stmt = gimple_build_assign (target_ssa, MULT_EXPR,
5360                                                   op1, op2);
5361                   gimple_set_location (mul_stmt, gimple_location (stmt));
5362                   gimple_set_uid (mul_stmt, gimple_uid (stmt));
5363                   gsi_insert_before (&gsi, mul_stmt, GSI_SAME_STMT);
5364                   rf1->repr = target_ssa;
5365
5366                   /* Don't reprocess the multiply we just introduced.  */
5367                   gimple_set_visited (mul_stmt, true);
5368                 }
5369             }
5370
5371           /* Form a call to __builtin_powi for the maximum product
5372              just formed, raised to the power obtained earlier.  */
5373           rf1 = &repeat_factor_vec[j];
5374           iter_result = make_temp_ssa_name (type, NULL, "reassocpow");
5375           pow_stmt = gimple_build_call (powi_fndecl, 2, rf1->repr,
5376                                         build_int_cst (integer_type_node,
5377                                                        power));
5378           gimple_call_set_lhs (pow_stmt, iter_result);
5379           gimple_set_location (pow_stmt, gimple_location (stmt));
5380           gimple_set_uid (pow_stmt, gimple_uid (stmt));
5381           gsi_insert_before (&gsi, pow_stmt, GSI_SAME_STMT);
5382         }
5383
5384       /* If we previously formed at least one other builtin_powi call,
5385          form the product of this one and those others.  */
5386       if (result)
5387         {
5388           tree new_result = make_temp_ssa_name (type, NULL, "reassocpow");
5389           mul_stmt = gimple_build_assign (new_result, MULT_EXPR,
5390                                           result, iter_result);
5391           gimple_set_location (mul_stmt, gimple_location (stmt));
5392           gimple_set_uid (mul_stmt, gimple_uid (stmt));
5393           gsi_insert_before (&gsi, mul_stmt, GSI_SAME_STMT);
5394           gimple_set_visited (mul_stmt, true);
5395           result = new_result;
5396         }
5397       else
5398         result = iter_result;
5399
5400       /* Decrement the occurrence count of each element in the product
5401          by the count found above, and remove this many copies of each
5402          factor from OPS.  */
5403       for (i = j; i < vec_len; i++)
5404         {
5405           unsigned k = power;
5406           unsigned n;
5407
5408           rf1 = &repeat_factor_vec[i];
5409           rf1->count -= power;
5410
5411           FOR_EACH_VEC_ELT_REVERSE (*ops, n, oe)
5412             {
5413               if (oe->op == rf1->factor)
5414                 {
5415                   if (oe->count <= k)
5416                     {
5417                       ops->ordered_remove (n);
5418                       k -= oe->count;
5419
5420                       if (k == 0)
5421                         break;
5422                     }
5423                   else
5424                     {
5425                       oe->count -= k;
5426                       break;
5427                     }
5428                 }
5429             }
5430         }
5431     }
5432
5433   /* At this point all elements in the repeated factor vector have a
5434      remaining occurrence count of 0 or 1, and those with a count of 1
5435      don't have cached representatives.  Re-sort the ops vector and
5436      clean up.  */
5437   ops->qsort (sort_by_operand_rank);
5438   repeat_factor_vec.release ();
5439
5440   /* Return the final product computed herein.  Note that there may
5441      still be some elements with single occurrence count left in OPS;
5442      those will be handled by the normal reassociation logic.  */
5443   return result;
5444 }
5445
5446 /* Attempt to optimize
5447    CST1 * copysign (CST2, y) -> copysign (CST1 * CST2, y) if CST1 > 0, or
5448    CST1 * copysign (CST2, y) -> -copysign (CST1 * CST2, y) if CST1 < 0.  */
5449
5450 static void
5451 attempt_builtin_copysign (vec<operand_entry *> *ops)
5452 {
5453   operand_entry *oe;
5454   unsigned int i;
5455   unsigned int length = ops->length ();
5456   tree cst = ops->last ()->op;
5457
5458   if (length == 1 || TREE_CODE (cst) != REAL_CST)
5459     return;
5460
5461   FOR_EACH_VEC_ELT (*ops, i, oe)
5462     {
5463       if (TREE_CODE (oe->op) == SSA_NAME
5464           && has_single_use (oe->op))
5465         {
5466           gimple *def_stmt = SSA_NAME_DEF_STMT (oe->op);
5467           if (gcall *old_call = dyn_cast <gcall *> (def_stmt))
5468             {
5469               tree arg0, arg1;
5470               switch (gimple_call_combined_fn (old_call))
5471                 {
5472                 CASE_CFN_COPYSIGN:
5473                   arg0 = gimple_call_arg (old_call, 0);
5474                   arg1 = gimple_call_arg (old_call, 1);
5475                   /* The first argument of copysign must be a constant,
5476                      otherwise there's nothing to do.  */
5477                   if (TREE_CODE (arg0) == REAL_CST)
5478                     {
5479                       tree type = TREE_TYPE (arg0);
5480                       tree mul = const_binop (MULT_EXPR, type, cst, arg0);
5481                       /* If we couldn't fold to a single constant, skip it.
5482                          That happens e.g. for inexact multiplication when
5483                          -frounding-math.  */
5484                       if (mul == NULL_TREE)
5485                         break;
5486                       /* Instead of adjusting OLD_CALL, let's build a new
5487                          call to not leak the LHS and prevent keeping bogus
5488                          debug statements.  DCE will clean up the old call.  */
5489                       gcall *new_call;
5490                       if (gimple_call_internal_p (old_call))
5491                         new_call = gimple_build_call_internal
5492                           (IFN_COPYSIGN, 2, mul, arg1);
5493                       else
5494                         new_call = gimple_build_call
5495                           (gimple_call_fndecl (old_call), 2, mul, arg1);
5496                       tree lhs = make_ssa_name (type);
5497                       gimple_call_set_lhs (new_call, lhs);
5498                       gimple_set_location (new_call,
5499                                            gimple_location (old_call));
5500                       insert_stmt_after (new_call, old_call);
5501                       /* We've used the constant, get rid of it.  */
5502                       ops->pop ();
5503                       bool cst1_neg = real_isneg (TREE_REAL_CST_PTR (cst));
5504                       /* Handle the CST1 < 0 case by negating the result.  */
5505                       if (cst1_neg)
5506                         {
5507                           tree negrhs = make_ssa_name (TREE_TYPE (lhs));
5508                           gimple *negate_stmt
5509                             = gimple_build_assign (negrhs, NEGATE_EXPR, lhs);
5510                           insert_stmt_after (negate_stmt, new_call);
5511                           oe->op = negrhs;
5512                         }
5513                       else
5514                         oe->op = lhs;
5515                       if (dump_file && (dump_flags & TDF_DETAILS))
5516                         {
5517                           fprintf (dump_file, "Optimizing copysign: ");
5518                           print_generic_expr (dump_file, cst);
5519                           fprintf (dump_file, " * COPYSIGN (");
5520                           print_generic_expr (dump_file, arg0);
5521                           fprintf (dump_file, ", ");
5522                           print_generic_expr (dump_file, arg1);
5523                           fprintf (dump_file, ") into %sCOPYSIGN (",
5524                                    cst1_neg ? "-" : "");
5525                           print_generic_expr (dump_file, mul);
5526                           fprintf (dump_file, ", ");
5527                           print_generic_expr (dump_file, arg1);
5528                           fprintf (dump_file, "\n");
5529                         }
5530                       return;
5531                     }
5532                   break;
5533                 default:
5534                   break;
5535                 }
5536             }
5537         }
5538     }
5539 }
5540
5541 /* Transform STMT at *GSI into a copy by replacing its rhs with NEW_RHS.  */
5542
5543 static void
5544 transform_stmt_to_copy (gimple_stmt_iterator *gsi, gimple *stmt, tree new_rhs)
5545 {
5546   tree rhs1;
5547
5548   if (dump_file && (dump_flags & TDF_DETAILS))
5549     {
5550       fprintf (dump_file, "Transforming ");
5551       print_gimple_stmt (dump_file, stmt, 0);
5552     }
5553
5554   rhs1 = gimple_assign_rhs1 (stmt);
5555   gimple_assign_set_rhs_from_tree (gsi, new_rhs);
5556   update_stmt (stmt);
5557   remove_visited_stmt_chain (rhs1);
5558
5559   if (dump_file && (dump_flags & TDF_DETAILS))
5560     {
5561       fprintf (dump_file, " into ");
5562       print_gimple_stmt (dump_file, stmt, 0);
5563     }
5564 }
5565
5566 /* Transform STMT at *GSI into a multiply of RHS1 and RHS2.  */
5567
5568 static void
5569 transform_stmt_to_multiply (gimple_stmt_iterator *gsi, gimple *stmt,
5570                             tree rhs1, tree rhs2)
5571 {
5572   if (dump_file && (dump_flags & TDF_DETAILS))
5573     {
5574       fprintf (dump_file, "Transforming ");
5575       print_gimple_stmt (dump_file, stmt, 0);
5576     }
5577
5578   gimple_assign_set_rhs_with_ops (gsi, MULT_EXPR, rhs1, rhs2);
5579   update_stmt (gsi_stmt (*gsi));
5580   remove_visited_stmt_chain (rhs1);
5581
5582   if (dump_file && (dump_flags & TDF_DETAILS))
5583     {
5584       fprintf (dump_file, " into ");
5585       print_gimple_stmt (dump_file, stmt, 0);
5586     }
5587 }
5588
5589 /* Reassociate expressions in basic block BB and its post-dominator as
5590    children.
5591
5592    Bubble up return status from maybe_optimize_range_tests.  */
5593
5594 static bool
5595 reassociate_bb (basic_block bb)
5596 {
5597   gimple_stmt_iterator gsi;
5598   basic_block son;
5599   gimple *stmt = last_stmt (bb);
5600   bool cfg_cleanup_needed = false;
5601
5602   if (stmt && !gimple_visited_p (stmt))
5603     cfg_cleanup_needed |= maybe_optimize_range_tests (stmt);
5604
5605   for (gsi = gsi_last_bb (bb); !gsi_end_p (gsi); gsi_prev (&gsi))
5606     {
5607       stmt = gsi_stmt (gsi);
5608
5609       if (is_gimple_assign (stmt)
5610           && !stmt_could_throw_p (stmt))
5611         {
5612           tree lhs, rhs1, rhs2;
5613           enum tree_code rhs_code = gimple_assign_rhs_code (stmt);
5614
5615           /* If this is not a gimple binary expression, there is
5616              nothing for us to do with it.  */
5617           if (get_gimple_rhs_class (rhs_code) != GIMPLE_BINARY_RHS)
5618             continue;
5619
5620           /* If this was part of an already processed statement,
5621              we don't need to touch it again. */
5622           if (gimple_visited_p (stmt))
5623             {
5624               /* This statement might have become dead because of previous
5625                  reassociations.  */
5626               if (has_zero_uses (gimple_get_lhs (stmt)))
5627                 {
5628                   reassoc_remove_stmt (&gsi);
5629                   release_defs (stmt);
5630                   /* We might end up removing the last stmt above which
5631                      places the iterator to the end of the sequence.
5632                      Reset it to the last stmt in this case which might
5633                      be the end of the sequence as well if we removed
5634                      the last statement of the sequence.  In which case
5635                      we need to bail out.  */
5636                   if (gsi_end_p (gsi))
5637                     {
5638                       gsi = gsi_last_bb (bb);
5639                       if (gsi_end_p (gsi))
5640                         break;
5641                     }
5642                 }
5643               continue;
5644             }
5645
5646           lhs = gimple_assign_lhs (stmt);
5647           rhs1 = gimple_assign_rhs1 (stmt);
5648           rhs2 = gimple_assign_rhs2 (stmt);
5649
5650           /* For non-bit or min/max operations we can't associate
5651              all types.  Verify that here.  */
5652           if (rhs_code != BIT_IOR_EXPR
5653               && rhs_code != BIT_AND_EXPR
5654               && rhs_code != BIT_XOR_EXPR
5655               && rhs_code != MIN_EXPR
5656               && rhs_code != MAX_EXPR
5657               && (!can_reassociate_p (lhs)
5658                   || !can_reassociate_p (rhs1)
5659                   || !can_reassociate_p (rhs2)))
5660             continue;
5661
5662           if (associative_tree_code (rhs_code))
5663             {
5664               auto_vec<operand_entry *> ops;
5665               tree powi_result = NULL_TREE;
5666               bool is_vector = VECTOR_TYPE_P (TREE_TYPE (lhs));
5667
5668               /* There may be no immediate uses left by the time we
5669                  get here because we may have eliminated them all.  */
5670               if (TREE_CODE (lhs) == SSA_NAME && has_zero_uses (lhs))
5671                 continue;
5672
5673               gimple_set_visited (stmt, true);
5674               linearize_expr_tree (&ops, stmt, true, true);
5675               ops.qsort (sort_by_operand_rank);
5676               int orig_len = ops.length ();
5677               optimize_ops_list (rhs_code, &ops);
5678               if (undistribute_ops_list (rhs_code, &ops,
5679                                          loop_containing_stmt (stmt)))
5680                 {
5681                   ops.qsort (sort_by_operand_rank);
5682                   optimize_ops_list (rhs_code, &ops);
5683                 }
5684
5685               if (rhs_code == PLUS_EXPR
5686                   && transform_add_to_multiply (&ops))
5687                 ops.qsort (sort_by_operand_rank);
5688
5689               if (rhs_code == BIT_IOR_EXPR || rhs_code == BIT_AND_EXPR)
5690                 {
5691                   if (is_vector)
5692                     optimize_vec_cond_expr (rhs_code, &ops);
5693                   else
5694                     optimize_range_tests (rhs_code, &ops);
5695                 }
5696
5697               if (rhs_code == MULT_EXPR && !is_vector)
5698                 {
5699                   attempt_builtin_copysign (&ops);
5700
5701                   if (reassoc_insert_powi_p
5702                       && flag_unsafe_math_optimizations)
5703                     powi_result = attempt_builtin_powi (stmt, &ops);
5704                 }
5705
5706               operand_entry *last;
5707               bool negate_result = false;
5708               if (ops.length () > 1
5709                   && rhs_code == MULT_EXPR)
5710                 {
5711                   last = ops.last ();
5712                   if ((integer_minus_onep (last->op)
5713                        || real_minus_onep (last->op))
5714                       && !HONOR_SNANS (TREE_TYPE (lhs))
5715                       && (!HONOR_SIGNED_ZEROS (TREE_TYPE (lhs))
5716                           || !COMPLEX_FLOAT_TYPE_P (TREE_TYPE (lhs))))
5717                     {
5718                       ops.pop ();
5719                       negate_result = true;
5720                     }
5721                 }
5722
5723               tree new_lhs = lhs;
5724               /* If the operand vector is now empty, all operands were
5725                  consumed by the __builtin_powi optimization.  */
5726               if (ops.length () == 0)
5727                 transform_stmt_to_copy (&gsi, stmt, powi_result);
5728               else if (ops.length () == 1)
5729                 {
5730                   tree last_op = ops.last ()->op;
5731
5732                   /* If the stmt that defines operand has to be inserted, insert it
5733                      before the use.  */
5734                   if (ops.last ()->stmt_to_insert)
5735                     insert_stmt_before_use (stmt, ops.last ()->stmt_to_insert);
5736                   if (powi_result)
5737                     transform_stmt_to_multiply (&gsi, stmt, last_op,
5738                                                 powi_result);
5739                   else
5740                     transform_stmt_to_copy (&gsi, stmt, last_op);
5741                 }
5742               else
5743                 {
5744                   machine_mode mode = TYPE_MODE (TREE_TYPE (lhs));
5745                   int ops_num = ops.length ();
5746                   int width = get_reassociation_width (ops_num, rhs_code, mode);
5747
5748                   if (dump_file && (dump_flags & TDF_DETAILS))
5749                     fprintf (dump_file,
5750                              "Width = %d was chosen for reassociation\n", width);
5751
5752                   if (width > 1
5753                       && ops.length () > 3)
5754                     rewrite_expr_tree_parallel (as_a <gassign *> (stmt),
5755                                                 width, ops);
5756                   else
5757                     {
5758                       /* When there are three operands left, we want
5759                          to make sure the ones that get the double
5760                          binary op are chosen wisely.  */
5761                       int len = ops.length ();
5762                       if (len >= 3)
5763                         swap_ops_for_binary_stmt (ops, len - 3, stmt);
5764
5765                       new_lhs = rewrite_expr_tree (stmt, 0, ops,
5766                                                    powi_result != NULL
5767                                                    || negate_result,
5768                                                    len != orig_len);
5769                     }
5770
5771                   /* If we combined some repeated factors into a
5772                      __builtin_powi call, multiply that result by the
5773                      reassociated operands.  */
5774                   if (powi_result)
5775                     {
5776                       gimple *mul_stmt, *lhs_stmt = SSA_NAME_DEF_STMT (lhs);
5777                       tree type = TREE_TYPE (lhs);
5778                       tree target_ssa = make_temp_ssa_name (type, NULL,
5779                                                             "reassocpow");
5780                       gimple_set_lhs (lhs_stmt, target_ssa);
5781                       update_stmt (lhs_stmt);
5782                       if (lhs != new_lhs)
5783                         {
5784                           target_ssa = new_lhs;
5785                           new_lhs = lhs;
5786                         }
5787                       mul_stmt = gimple_build_assign (lhs, MULT_EXPR,
5788                                                       powi_result, target_ssa);
5789                       gimple_set_location (mul_stmt, gimple_location (stmt));
5790                       gimple_set_uid (mul_stmt, gimple_uid (stmt));
5791                       gsi_insert_after (&gsi, mul_stmt, GSI_NEW_STMT);
5792                     }
5793                 }
5794
5795               if (negate_result)
5796                 {
5797                   stmt = SSA_NAME_DEF_STMT (lhs);
5798                   tree tmp = make_ssa_name (TREE_TYPE (lhs));
5799                   gimple_set_lhs (stmt, tmp);
5800                   if (lhs != new_lhs)
5801                     tmp = new_lhs;
5802                   gassign *neg_stmt = gimple_build_assign (lhs, NEGATE_EXPR,
5803                                                            tmp);
5804                   gimple_set_uid (neg_stmt, gimple_uid (stmt));
5805                   gsi_insert_after (&gsi, neg_stmt, GSI_NEW_STMT);
5806                   update_stmt (stmt);
5807                 }
5808             }
5809         }
5810     }
5811   for (son = first_dom_son (CDI_POST_DOMINATORS, bb);
5812        son;
5813        son = next_dom_son (CDI_POST_DOMINATORS, son))
5814     cfg_cleanup_needed |= reassociate_bb (son);
5815
5816   return cfg_cleanup_needed;
5817 }
5818
5819 /* Add jumps around shifts for range tests turned into bit tests.
5820    For each SSA_NAME VAR we have code like:
5821    VAR = ...; // final stmt of range comparison
5822    // bit test here...;
5823    OTHERVAR = ...; // final stmt of the bit test sequence
5824    RES = VAR | OTHERVAR;
5825    Turn the above into:
5826    VAR = ...;
5827    if (VAR != 0)
5828      goto <l3>;
5829    else
5830      goto <l2>;
5831    <l2>:
5832    // bit test here...;
5833    OTHERVAR = ...;
5834    <l3>:
5835    # RES = PHI<1(l1), OTHERVAR(l2)>;  */
5836
5837 static void
5838 branch_fixup (void)
5839 {
5840   tree var;
5841   unsigned int i;
5842
5843   FOR_EACH_VEC_ELT (reassoc_branch_fixups, i, var)
5844     {
5845       gimple *def_stmt = SSA_NAME_DEF_STMT (var);
5846       gimple *use_stmt;
5847       use_operand_p use;
5848       bool ok = single_imm_use (var, &use, &use_stmt);
5849       gcc_assert (ok
5850                   && is_gimple_assign (use_stmt)
5851                   && gimple_assign_rhs_code (use_stmt) == BIT_IOR_EXPR
5852                   && gimple_bb (def_stmt) == gimple_bb (use_stmt));
5853
5854       basic_block cond_bb = gimple_bb (def_stmt);
5855       basic_block then_bb = split_block (cond_bb, def_stmt)->dest;
5856       basic_block merge_bb = split_block (then_bb, use_stmt)->dest;
5857
5858       gimple_stmt_iterator gsi = gsi_for_stmt (def_stmt);
5859       gimple *g = gimple_build_cond (NE_EXPR, var,
5860                                      build_zero_cst (TREE_TYPE (var)),
5861                                      NULL_TREE, NULL_TREE);
5862       location_t loc = gimple_location (use_stmt);
5863       gimple_set_location (g, loc);
5864       gsi_insert_after (&gsi, g, GSI_NEW_STMT);
5865
5866       edge etrue = make_edge (cond_bb, merge_bb, EDGE_TRUE_VALUE);
5867       etrue->probability = profile_probability::even ();
5868       etrue->count = cond_bb->count.apply_scale (1, 2);
5869       edge efalse = find_edge (cond_bb, then_bb);
5870       efalse->flags = EDGE_FALSE_VALUE;
5871       efalse->probability -= etrue->probability;
5872       efalse->count -= etrue->count;
5873       then_bb->count -= etrue->count;
5874
5875       tree othervar = NULL_TREE;
5876       if (gimple_assign_rhs1 (use_stmt) == var)
5877         othervar = gimple_assign_rhs2 (use_stmt);
5878       else if (gimple_assign_rhs2 (use_stmt) == var)
5879         othervar = gimple_assign_rhs1 (use_stmt);
5880       else
5881         gcc_unreachable ();
5882       tree lhs = gimple_assign_lhs (use_stmt);
5883       gphi *phi = create_phi_node (lhs, merge_bb);
5884       add_phi_arg (phi, build_one_cst (TREE_TYPE (lhs)), etrue, loc);
5885       add_phi_arg (phi, othervar, single_succ_edge (then_bb), loc);
5886       gsi = gsi_for_stmt (use_stmt);
5887       gsi_remove (&gsi, true);
5888
5889       set_immediate_dominator (CDI_DOMINATORS, merge_bb, cond_bb);
5890       set_immediate_dominator (CDI_POST_DOMINATORS, cond_bb, merge_bb);
5891     }
5892   reassoc_branch_fixups.release ();
5893 }
5894
5895 void dump_ops_vector (FILE *file, vec<operand_entry *> ops);
5896 void debug_ops_vector (vec<operand_entry *> ops);
5897
5898 /* Dump the operand entry vector OPS to FILE.  */
5899
5900 void
5901 dump_ops_vector (FILE *file, vec<operand_entry *> ops)
5902 {
5903   operand_entry *oe;
5904   unsigned int i;
5905
5906   FOR_EACH_VEC_ELT (ops, i, oe)
5907     {
5908       fprintf (file, "Op %d -> rank: %d, tree: ", i, oe->rank);
5909       print_generic_expr (file, oe->op);
5910       fprintf (file, "\n");
5911     }
5912 }
5913
5914 /* Dump the operand entry vector OPS to STDERR.  */
5915
5916 DEBUG_FUNCTION void
5917 debug_ops_vector (vec<operand_entry *> ops)
5918 {
5919   dump_ops_vector (stderr, ops);
5920 }
5921
5922 /* Bubble up return status from reassociate_bb.  */
5923
5924 static bool
5925 do_reassoc (void)
5926 {
5927   break_up_subtract_bb (ENTRY_BLOCK_PTR_FOR_FN (cfun));
5928   return reassociate_bb (EXIT_BLOCK_PTR_FOR_FN (cfun));
5929 }
5930
5931 /* Initialize the reassociation pass.  */
5932
5933 static void
5934 init_reassoc (void)
5935 {
5936   int i;
5937   long rank = 2;
5938   int *bbs = XNEWVEC (int, n_basic_blocks_for_fn (cfun) - NUM_FIXED_BLOCKS);
5939
5940   /* Find the loops, so that we can prevent moving calculations in
5941      them.  */
5942   loop_optimizer_init (AVOID_CFG_MODIFICATIONS);
5943
5944   memset (&reassociate_stats, 0, sizeof (reassociate_stats));
5945
5946   next_operand_entry_id = 0;
5947
5948   /* Reverse RPO (Reverse Post Order) will give us something where
5949      deeper loops come later.  */
5950   pre_and_rev_post_order_compute (NULL, bbs, false);
5951   bb_rank = XCNEWVEC (long, last_basic_block_for_fn (cfun));
5952   operand_rank = new hash_map<tree, long>;
5953
5954   /* Give each default definition a distinct rank.  This includes
5955      parameters and the static chain.  Walk backwards over all
5956      SSA names so that we get proper rank ordering according
5957      to tree_swap_operands_p.  */
5958   for (i = num_ssa_names - 1; i > 0; --i)
5959     {
5960       tree name = ssa_name (i);
5961       if (name && SSA_NAME_IS_DEFAULT_DEF (name))
5962         insert_operand_rank (name, ++rank);
5963     }
5964
5965   /* Set up rank for each BB  */
5966   for (i = 0; i < n_basic_blocks_for_fn (cfun) - NUM_FIXED_BLOCKS; i++)
5967     bb_rank[bbs[i]] = ++rank  << 16;
5968
5969   free (bbs);
5970   calculate_dominance_info (CDI_POST_DOMINATORS);
5971   plus_negates = vNULL;
5972 }
5973
5974 /* Cleanup after the reassociation pass, and print stats if
5975    requested.  */
5976
5977 static void
5978 fini_reassoc (void)
5979 {
5980   statistics_counter_event (cfun, "Linearized",
5981                             reassociate_stats.linearized);
5982   statistics_counter_event (cfun, "Constants eliminated",
5983                             reassociate_stats.constants_eliminated);
5984   statistics_counter_event (cfun, "Ops eliminated",
5985                             reassociate_stats.ops_eliminated);
5986   statistics_counter_event (cfun, "Statements rewritten",
5987                             reassociate_stats.rewritten);
5988   statistics_counter_event (cfun, "Built-in pow[i] calls encountered",
5989                             reassociate_stats.pows_encountered);
5990   statistics_counter_event (cfun, "Built-in powi calls created",
5991                             reassociate_stats.pows_created);
5992
5993   delete operand_rank;
5994   operand_entry_pool.release ();
5995   free (bb_rank);
5996   plus_negates.release ();
5997   free_dominance_info (CDI_POST_DOMINATORS);
5998   loop_optimizer_finalize ();
5999 }
6000
6001 /* Gate and execute functions for Reassociation.  If INSERT_POWI_P, enable
6002    insertion of __builtin_powi calls.
6003
6004    Returns TODO_cfg_cleanup if a CFG cleanup pass is desired due to
6005    optimization of a gimple conditional.  Otherwise returns zero.  */
6006
6007 static unsigned int
6008 execute_reassoc (bool insert_powi_p)
6009 {
6010   reassoc_insert_powi_p = insert_powi_p;
6011
6012   init_reassoc ();
6013
6014   bool cfg_cleanup_needed;
6015   cfg_cleanup_needed = do_reassoc ();
6016   repropagate_negates ();
6017   branch_fixup ();
6018
6019   fini_reassoc ();
6020   return cfg_cleanup_needed ? TODO_cleanup_cfg : 0;
6021 }
6022
6023 namespace {
6024
6025 const pass_data pass_data_reassoc =
6026 {
6027   GIMPLE_PASS, /* type */
6028   "reassoc", /* name */
6029   OPTGROUP_NONE, /* optinfo_flags */
6030   TV_TREE_REASSOC, /* tv_id */
6031   ( PROP_cfg | PROP_ssa ), /* properties_required */
6032   0, /* properties_provided */
6033   0, /* properties_destroyed */
6034   0, /* todo_flags_start */
6035   TODO_update_ssa_only_virtuals, /* todo_flags_finish */
6036 };
6037
6038 class pass_reassoc : public gimple_opt_pass
6039 {
6040 public:
6041   pass_reassoc (gcc::context *ctxt)
6042     : gimple_opt_pass (pass_data_reassoc, ctxt), insert_powi_p (false)
6043   {}
6044
6045   /* opt_pass methods: */
6046   opt_pass * clone () { return new pass_reassoc (m_ctxt); }
6047   void set_pass_param (unsigned int n, bool param)
6048     {
6049       gcc_assert (n == 0);
6050       insert_powi_p = param;
6051     }
6052   virtual bool gate (function *) { return flag_tree_reassoc != 0; }
6053   virtual unsigned int execute (function *)
6054     { return execute_reassoc (insert_powi_p); }
6055
6056  private:
6057   /* Enable insertion of __builtin_powi calls during execute_reassoc.  See
6058      point 3a in the pass header comment.  */
6059   bool insert_powi_p;
6060 }; // class pass_reassoc
6061
6062 } // anon namespace
6063
6064 gimple_opt_pass *
6065 make_pass_reassoc (gcc::context *ctxt)
6066 {
6067   return new pass_reassoc (ctxt);
6068 }