dist/gcc/tree-ssa-loop-niter.cc

1.1  mrg /* Functions to determine/estimate number of iterations of a loop.
1.1  mrg    Copyright (C) 2004-2022 Free Software Foundation, Inc.
1.1  mrg
1.1  mrg This file is part of GCC.
1.1  mrg
1.1  mrg GCC is free software; you can redistribute it and/or modify it
1.1  mrg under the terms of the GNU General Public License as published by the
1.1  mrg Free Software Foundation; either version 3, or (at your option) any
1.1  mrg later version.
1.1  mrg
1.1  mrg GCC is distributed in the hope that it will be useful, but WITHOUT
1.1  mrg ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
1.1  mrg FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
1.1  mrg for more details.
1.1  mrg
1.1  mrg You should have received a copy of the GNU General Public License
1.1  mrg along with GCC; see the file COPYING3.  If not see
1.1  mrg <http://www.gnu.org/licenses/>.  */
1.1  mrg
1.1  mrg #include "config.h"
1.1  mrg #include "system.h"
1.1  mrg #include "coretypes.h"
1.1  mrg #include "backend.h"
1.1  mrg #include "rtl.h"
1.1  mrg #include "tree.h"
1.1  mrg #include "gimple.h"
1.1  mrg #include "tree-pass.h"
1.1  mrg #include "ssa.h"
1.1  mrg #include "gimple-pretty-print.h"
1.1  mrg #include "diagnostic-core.h"
1.1  mrg #include "stor-layout.h"
1.1  mrg #include "fold-const.h"
1.1  mrg #include "calls.h"
1.1  mrg #include "intl.h"
1.1  mrg #include "gimplify.h"
1.1  mrg #include "gimple-iterator.h"
1.1  mrg #include "tree-cfg.h"
1.1  mrg #include "tree-ssa-loop-ivopts.h"
1.1  mrg #include "tree-ssa-loop-niter.h"
1.1  mrg #include "tree-ssa-loop.h"
1.1  mrg #include "cfgloop.h"
1.1  mrg #include "tree-chrec.h"
1.1  mrg #include "tree-scalar-evolution.h"
1.1  mrg #include "tree-dfa.h"
1.1  mrg #include "gimple-range.h"
1.1  mrg
1.1  mrg
1.1  mrg /* The maximum number of dominator BBs we search for conditions
1.1  mrg    of loop header copies we use for simplifying a conditional
1.1  mrg    expression.  In determine_value_range and bound_difference this
1.1  mrg    limits how many guard conditions are examined while walking up the
1.1  mrg    dominator tree from the loop header; dominators that are not entered
1.1  mrg    through a single true/false edge are skipped without being counted
1.1  mrg    against the limit.  */
1.1  mrg #define MAX_DOMINATORS_TO_WALK 8
1.1  mrg
1.1  mrg /*
1.1  mrg
1.1  mrg    Analysis of number of iterations of an affine exit test.
1.1  mrg
1.1  mrg */
1.1  mrg
1.1  mrg /* An inclusive interval bounding some value X, i.e. BELOW <= X <= UP,
1.1  mrg    with both ends held as GMP integers.  */
1.1  mrg
1.1  mrg struct bounds
1.1  mrg {
1.1  mrg   /* Lower end of the interval.  */
1.1  mrg   mpz_t below;
1.1  mrg   /* Upper end of the interval.  */
1.1  mrg   mpz_t up;
1.1  mrg };
1.1  mrg
1.1  mrg static bool number_of_iterations_popcount (loop_p loop, edge exit,
1.1  mrg 					   enum tree_code code,
1.1  mrg 					   class tree_niter_desc *niter);
1.1  mrg
1.1  mrg
1.1  mrg /* Decomposes EXPR into a variable part, stored to *VAR, and a constant
1.1  mrg    part, stored to OFFSET.  OFFSET is only assigned here, so it must
1.1  mrg    already have been initialized by the caller.
1.1  mrg
1.1  mrg    -- For VAR + CST, VAR - CST and pointer + CST, *VAR is the first
1.1  mrg       operand and OFFSET the sign-extended constant, negated for a
1.1  mrg       subtraction.
1.1  mrg    -- For a bare integer constant, *VAR is zero of the type of EXPR and
1.1  mrg       OFFSET is the constant, read with the signedness of that type.
1.1  mrg    -- Anything else is returned whole in *VAR with a zero OFFSET.  */
1.1  mrg
1.1  mrg static void
1.1  mrg split_to_var_and_offset (tree expr, tree *var, mpz_t offset)
1.1  mrg {
1.1  mrg   tree type = TREE_TYPE (expr);
1.1  mrg   const enum tree_code code = TREE_CODE (expr);
1.1  mrg
1.1  mrg   /* Result for every expression that cannot be split.  */
1.1  mrg   *var = expr;
1.1  mrg   mpz_set_ui (offset, 0);
1.1  mrg
1.1  mrg   if (code == INTEGER_CST)
1.1  mrg     {
1.1  mrg       *var = build_int_cst_type (type, 0);
1.1  mrg       wi::to_mpz (wi::to_wide (expr), offset, TYPE_SIGN (type));
1.1  mrg       return;
1.1  mrg     }
1.1  mrg
1.1  mrg   if (code != PLUS_EXPR
1.1  mrg       && code != POINTER_PLUS_EXPR
1.1  mrg       && code != MINUS_EXPR)
1.1  mrg     return;
1.1  mrg
1.1  mrg   tree base = TREE_OPERAND (expr, 0);
1.1  mrg   tree addend = TREE_OPERAND (expr, 1);
1.1  mrg
1.1  mrg   /* Only a constant second operand can be peeled off.  */
1.1  mrg   if (TREE_CODE (addend) != INTEGER_CST)
1.1  mrg     return;
1.1  mrg
1.1  mrg   *var = base;
1.1  mrg   /* The offset is sign extended regardless of the type's signedness.  */
1.1  mrg   wi::to_mpz (wi::to_wide (addend), offset, SIGNED);
1.1  mrg   if (code == MINUS_EXPR)
1.1  mrg     mpz_neg (offset, offset);
1.1  mrg }
1.1  mrg
1.1  mrg /* From condition C0 CMP C1 derives information regarding the value range
1.1  mrg    of VAR, which is of TYPE.  Results are stored in to BELOW and UP.
1.1  mrg
1.1  mrg    BELOW and UP are in-out parameters: on entry they hold the bounds
1.1  mrg    known so far (the NE_EXPR case compares the constant against them),
1.1  mrg    and they are only ever tightened.  The guard is used only if, after
1.1  mrg    each side has been split into a variable part and a constant offset,
1.1  mrg    one of the sides is based on VAR.  If it is not, or if wrap-around
1.1  mrg    of the offsetted expressions cannot be ruled out, BELOW and UP are
1.1  mrg    left untouched.  */
1.1  mrg
1.1  mrg static void
1.1  mrg refine_value_range_using_guard (tree type, tree var,
1.1  mrg 				tree c0, enum tree_code cmp, tree c1,
1.1  mrg 				mpz_t below, mpz_t up)
1.1  mrg {
1.1  mrg   tree varc0, varc1, ctype;
1.1  mrg   mpz_t offc0, offc1;
1.1  mrg   mpz_t mint, maxt, minc1, maxc1;
1.1  mrg   bool no_wrap = nowrap_type_p (type);
1.1  mrg   bool c0_ok, c1_ok;
1.1  mrg   signop sgn = TYPE_SIGN (type);
1.1  mrg
1.1  mrg   switch (cmp)
1.1  mrg     {
1.1  mrg     case LT_EXPR:
1.1  mrg     case LE_EXPR:
1.1  mrg     case GT_EXPR:
1.1  mrg     case GE_EXPR:
1.1  mrg       STRIP_SIGN_NOPS (c0);
1.1  mrg       STRIP_SIGN_NOPS (c1);
1.1  mrg       ctype = TREE_TYPE (c0);
1.1  mrg       if (!useless_type_conversion_p (ctype, type))
1.1  mrg 	return;
1.1  mrg
1.1  mrg       break;
1.1  mrg
1.1  mrg     case EQ_EXPR:
1.1  mrg       /* We could derive quite precise information from EQ_EXPR, however,
1.1  mrg 	 such a guard is unlikely to appear, so we do not bother with
1.1  mrg 	 handling it.  */
1.1  mrg       return;
1.1  mrg
1.1  mrg     case NE_EXPR:
1.1  mrg       /* NE_EXPR comparisons do not contain much of useful information,
1.1  mrg 	 except for cases of comparing with bounds.  */
1.1  mrg       if (TREE_CODE (c1) != INTEGER_CST
1.1  mrg 	  || !INTEGRAL_TYPE_P (type))
1.1  mrg 	return;
1.1  mrg
1.1  mrg       /* Ensure that the condition speaks about an expression in the same
1.1  mrg 	 type as X and Y.  */
1.1  mrg       ctype = TREE_TYPE (c0);
1.1  mrg       if (TYPE_PRECISION (ctype) != TYPE_PRECISION (type))
1.1  mrg 	return;
1.1  mrg       c0 = fold_convert (type, c0);
1.1  mrg       c1 = fold_convert (type, c1);
1.1  mrg
1.1  mrg       if (operand_equal_p (var, c0, 0))
1.1  mrg 	{
1.1  mrg 	  mpz_t valc1;
1.1  mrg
1.1  mrg 	  /* Case of comparing VAR with its below/up bounds: being
1.1  mrg 	     different from the current lower bound means being above
1.1  mrg 	     it, and being different from the current upper bound means
1.1  mrg 	     being below it.  */
1.1  mrg 	  mpz_init (valc1);
1.1  mrg 	  wi::to_mpz (wi::to_wide (c1), valc1, TYPE_SIGN (type));
1.1  mrg 	  if (mpz_cmp (valc1, below) == 0)
1.1  mrg 	    cmp = GT_EXPR;
1.1  mrg 	  if (mpz_cmp (valc1, up) == 0)
1.1  mrg 	    cmp = LT_EXPR;
1.1  mrg
1.1  mrg 	  mpz_clear (valc1);
1.1  mrg 	}
1.1  mrg       else
1.1  mrg 	{
1.1  mrg 	  /* Case of comparing with the bounds of the type.  */
1.1  mrg 	  wide_int min = wi::min_value (type);
1.1  mrg 	  wide_int max = wi::max_value (type);
1.1  mrg
1.1  mrg 	  if (wi::to_wide (c1) == min)
1.1  mrg 	    cmp = GT_EXPR;
1.1  mrg 	  if (wi::to_wide (c1) == max)
1.1  mrg 	    cmp = LT_EXPR;
1.1  mrg 	}
1.1  mrg
1.1  mrg       /* Quick return if no useful information.  */
1.1  mrg       if (cmp == NE_EXPR)
1.1  mrg 	return;
1.1  mrg
1.1  mrg       break;
1.1  mrg
1.1  mrg     default:
1.1  mrg       return;
1.1  mrg     }
1.1  mrg
1.1  mrg   mpz_init (offc0);
1.1  mrg   mpz_init (offc1);
1.1  mrg   split_to_var_and_offset (expand_simple_operations (c0), &varc0, offc0);
1.1  mrg   split_to_var_and_offset (expand_simple_operations (c1), &varc1, offc1);
1.1  mrg
1.1  mrg   /* We are only interested in comparisons of expressions based on VAR.
1.1  mrg      Canonicalize so that the VAR-based side is VARC0 + OFFC0, swapping
1.1  mrg      the comparison along with the operands when needed.  */
1.1  mrg   if (operand_equal_p (var, varc1, 0))
1.1  mrg     {
1.1  mrg       std::swap (varc0, varc1);
1.1  mrg       mpz_swap (offc0, offc1);
1.1  mrg       cmp = swap_tree_comparison (cmp);
1.1  mrg     }
1.1  mrg   else if (!operand_equal_p (var, varc0, 0))
1.1  mrg     {
1.1  mrg       mpz_clear (offc0);
1.1  mrg       mpz_clear (offc1);
1.1  mrg       return;
1.1  mrg     }
1.1  mrg
1.1  mrg   mpz_init (mint);
1.1  mrg   mpz_init (maxt);
1.1  mrg   get_type_static_bounds (type, mint, maxt);
1.1  mrg   mpz_init (minc1);
1.1  mrg   mpz_init (maxc1);
1.1  mrg   value_range r;
1.1  mrg   /* Setup range information for varc1: exactly zero when the variable
1.1  mrg      part is zero (which is how split_to_var_and_offset reports a
1.1  mrg      constant), the range reported by the range query for an SSA name
1.1  mrg      with a VR_RANGE, and the static bounds of TYPE otherwise.  */
1.1  mrg   if (integer_zerop (varc1))
1.1  mrg     {
1.1  mrg       wi::to_mpz (0, minc1, TYPE_SIGN (type));
1.1  mrg       wi::to_mpz (0, maxc1, TYPE_SIGN (type));
1.1  mrg     }
1.1  mrg   else if (TREE_CODE (varc1) == SSA_NAME
1.1  mrg 	   && INTEGRAL_TYPE_P (type)
1.1  mrg 	   && get_range_query (cfun)->range_of_expr (r, varc1)
1.1  mrg 	   && r.kind () == VR_RANGE)
1.1  mrg     {
1.1  mrg       gcc_assert (wi::le_p (r.lower_bound (), r.upper_bound (), sgn));
1.1  mrg       wi::to_mpz (r.lower_bound (), minc1, sgn);
1.1  mrg       wi::to_mpz (r.upper_bound (), maxc1, sgn);
1.1  mrg     }
1.1  mrg   else
1.1  mrg     {
1.1  mrg       mpz_set (minc1, mint);
1.1  mrg       mpz_set (maxc1, maxt);
1.1  mrg     }
1.1  mrg
1.1  mrg   /* Compute valid range information for varc1 + offc1.  Note nothing
1.1  mrg      useful can be derived if it overflows or underflows.  Overflow or
1.1  mrg      underflow could happen when:
1.1  mrg
1.1  mrg        offc1 > 0 && varc1 + offc1 > MAX_VAL (type)
1.1  mrg        offc1 < 0 && varc1 + offc1 < MIN_VAL (type).  */
1.1  mrg   mpz_add (minc1, minc1, offc1);
1.1  mrg   mpz_add (maxc1, maxc1, offc1);
1.1  mrg   c1_ok = (no_wrap
1.1  mrg 	   || mpz_sgn (offc1) == 0
1.1  mrg 	   || (mpz_sgn (offc1) < 0 && mpz_cmp (minc1, mint) >= 0)
1.1  mrg 	   || (mpz_sgn (offc1) > 0 && mpz_cmp (maxc1, maxt) <= 0));
1.1  mrg   if (!c1_ok)
1.1  mrg     goto end;
1.1  mrg
1.1  mrg   if (mpz_cmp (minc1, mint) < 0)
1.1  mrg     mpz_set (minc1, mint);
1.1  mrg   if (mpz_cmp (maxc1, maxt) > 0)
1.1  mrg     mpz_set (maxc1, maxt);
1.1  mrg
1.1  mrg   if (cmp == LT_EXPR)
1.1  mrg     {
1.1  mrg       cmp = LE_EXPR;  /* X < Y is X <= Y - 1.  */
1.1  mrg       mpz_sub_ui (maxc1, maxc1, 1);
1.1  mrg     }
1.1  mrg   if (cmp == GT_EXPR)
1.1  mrg     {
1.1  mrg       cmp = GE_EXPR;  /* X > Y is X >= Y + 1.  */
1.1  mrg       mpz_add_ui (minc1, minc1, 1);
1.1  mrg     }
1.1  mrg
1.1  mrg   /* Compute range information for varc0.  If there is no overflow,
1.1  mrg      the condition implied that
1.1  mrg
1.1  mrg        (varc0) cmp (varc1 + offc1 - offc0)
1.1  mrg
1.1  mrg      We can possibly improve the upper bound of varc0 if cmp is LE_EXPR,
1.1  mrg      or the below bound if cmp is GE_EXPR.
1.1  mrg
1.1  mrg      To prove there is no overflow/underflow, we need to check below
1.1  mrg      four cases:
1.1  mrg        1) cmp == LE_EXPR && offc0 > 0
1.1  mrg
1.1  mrg 	    (varc0 + offc0) doesn't overflow
1.1  mrg 	    && (varc1 + offc1 - offc0) doesn't underflow
1.1  mrg
1.1  mrg        2) cmp == LE_EXPR && offc0 < 0
1.1  mrg
1.1  mrg 	    (varc0 + offc0) doesn't underflow
1.1  mrg 	    && (varc1 + offc1 - offc0) doesn't overflow
1.1  mrg
1.1  mrg 	  In this case, (varc0 + offc0) will never underflow if we can
1.1  mrg 	  prove (varc1 + offc1 - offc0) doesn't overflow.
1.1  mrg
1.1  mrg        3) cmp == GE_EXPR && offc0 < 0
1.1  mrg
1.1  mrg 	    (varc0 + offc0) doesn't underflow
1.1  mrg 	    && (varc1 + offc1 - offc0) doesn't overflow
1.1  mrg
1.1  mrg        4) cmp == GE_EXPR && offc0 > 0
1.1  mrg
1.1  mrg 	    (varc0 + offc0) doesn't overflow
1.1  mrg 	    && (varc1 + offc1 - offc0) doesn't underflow
1.1  mrg
1.1  mrg 	  In this case, (varc0 + offc0) will never overflow if we can
1.1  mrg 	  prove (varc1 + offc1 - offc0) doesn't underflow.
1.1  mrg
1.1  mrg      Note we only handle case 2 and 4 in below code.  */
1.1  mrg
1.1  mrg   mpz_sub (minc1, minc1, offc0);
1.1  mrg   mpz_sub (maxc1, maxc1, offc0);
1.1  mrg   c0_ok = (no_wrap
1.1  mrg 	   || mpz_sgn (offc0) == 0
1.1  mrg 	   || (cmp == LE_EXPR
1.1  mrg 	       && mpz_sgn (offc0) < 0 && mpz_cmp (maxc1, maxt) <= 0)
1.1  mrg 	   || (cmp == GE_EXPR
1.1  mrg 	       && mpz_sgn (offc0) > 0 && mpz_cmp (minc1, mint) >= 0));
1.1  mrg   if (!c0_ok)
1.1  mrg     goto end;
1.1  mrg
1.1  mrg   if (cmp == LE_EXPR)
1.1  mrg     {
1.1  mrg       if (mpz_cmp (up, maxc1) > 0)
1.1  mrg 	mpz_set (up, maxc1);  /* Only ever lowers UP.  */
1.1  mrg     }
1.1  mrg   else
1.1  mrg     {
1.1  mrg       if (mpz_cmp (below, minc1) < 0)
1.1  mrg 	mpz_set (below, minc1);  /* Only ever raises BELOW.  */
1.1  mrg     }
1.1  mrg
1.1  mrg end:
1.1  mrg   mpz_clear (mint);
1.1  mrg   mpz_clear (maxt);
1.1  mrg   mpz_clear (minc1);
1.1  mrg   mpz_clear (maxc1);
1.1  mrg   mpz_clear (offc0);
1.1  mrg   mpz_clear (offc1);
1.1  mrg }
1.1  mrg
1.1  mrg /* Stores estimate on the minimum/maximum value of the expression VAR + OFF
1.1  mrg    in TYPE to MIN and MAX.
1.1  mrg
1.1  mrg    MIN and MAX are only assigned here, so the caller must have
1.1  mrg    initialized them.  A zero VAR denotes a constant, whose value is
1.1  mrg    exactly OFF.  Otherwise the estimate starts from the static bounds
1.1  mrg    of TYPE and, when VAR is an SSA name of integral type, is narrowed
1.1  mrg    using the range information for VAR, for the PHI results in the
1.1  mrg    header of LOOP that receive VAR on the preheader edge, and the
1.1  mrg    conditions guarding the entry to LOOP.  The narrowed range is used
1.1  mrg    only if adding OFF to it is known not to wrap.  */
1.1  mrg
1.1  mrg static void
1.1  mrg determine_value_range (class loop *loop, tree type, tree var, mpz_t off,
1.1  mrg 		       mpz_t min, mpz_t max)
1.1  mrg {
1.1  mrg   int cnt = 0;
1.1  mrg   mpz_t minm, maxm;
1.1  mrg   basic_block bb;
1.1  mrg   wide_int minv, maxv;
1.1  mrg   enum value_range_kind rtype = VR_VARYING;
1.1  mrg
1.1  mrg   /* If the expression is a constant, we know its value exactly.  */
1.1  mrg   if (integer_zerop (var))
1.1  mrg     {
1.1  mrg       mpz_set (min, off);
1.1  mrg       mpz_set (max, off);
1.1  mrg       return;
1.1  mrg     }
1.1  mrg
1.1  mrg   get_type_static_bounds (type, min, max);
1.1  mrg
1.1  mrg   /* See if we have some range info from VRP.  */
1.1  mrg   if (TREE_CODE (var) == SSA_NAME && INTEGRAL_TYPE_P (type))
1.1  mrg     {
1.1  mrg       edge e = loop_preheader_edge (loop);
1.1  mrg       signop sgn = TYPE_SIGN (type);
1.1  mrg       gphi_iterator gsi;
1.1  mrg
1.1  mrg       /* Either for VAR itself...  */
1.1  mrg       value_range var_range;
1.1  mrg       get_range_query (cfun)->range_of_expr (var_range, var);
1.1  mrg       rtype = var_range.kind ();
1.1  mrg       if (!var_range.undefined_p ())
1.1  mrg 	{
1.1  mrg 	  minv = var_range.lower_bound ();
1.1  mrg 	  maxv = var_range.upper_bound ();
1.1  mrg 	}
1.1  mrg
1.1  mrg       /* Or for PHI results in loop->header where VAR is used as
1.1  mrg 	 PHI argument from the loop preheader edge.  The first usable
1.1  mrg 	 PHI range replaces a non-VR_RANGE result for VAR; later ones
1.1  mrg 	 are intersected with what has been collected so far.  */
1.1  mrg       for (gsi = gsi_start_phis (loop->header); !gsi_end_p (gsi); gsi_next (&gsi))
1.1  mrg 	{
1.1  mrg 	  gphi *phi = gsi.phi ();
1.1  mrg 	  value_range phi_range;
1.1  mrg 	  if (PHI_ARG_DEF_FROM_EDGE (phi, e) == var
1.1  mrg 	      && get_range_query (cfun)->range_of_expr (phi_range,
1.1  mrg 						    gimple_phi_result (phi))
1.1  mrg 	      && phi_range.kind () == VR_RANGE)
1.1  mrg 	    {
1.1  mrg 	      if (rtype != VR_RANGE)
1.1  mrg 		{
1.1  mrg 		  rtype = VR_RANGE;
1.1  mrg 		  minv = phi_range.lower_bound ();
1.1  mrg 		  maxv = phi_range.upper_bound ();
1.1  mrg 		}
1.1  mrg 	      else
1.1  mrg 		{
1.1  mrg 		  minv = wi::max (minv, phi_range.lower_bound (), sgn);
1.1  mrg 		  maxv = wi::min (maxv, phi_range.upper_bound (), sgn);
1.1  mrg 		  /* If the PHI result range are inconsistent with
1.1  mrg 		     the VAR range, give up on looking at the PHI
1.1  mrg 		     results.  This can happen if VR_UNDEFINED is
1.1  mrg 		     involved.  The range of VAR itself is queried
1.1  mrg 		     again to undo the intersections done so far.  */
1.1  mrg 		  if (wi::gt_p (minv, maxv, sgn))
1.1  mrg 		    {
1.1  mrg 		      value_range vr;
1.1  mrg 		      get_range_query (cfun)->range_of_expr (vr, var);
1.1  mrg 		      rtype = vr.kind ();
1.1  mrg 		      if (!vr.undefined_p ())
1.1  mrg 			{
1.1  mrg 			  minv = vr.lower_bound ();
1.1  mrg 			  maxv = vr.upper_bound ();
1.1  mrg 			}
1.1  mrg 		      break;
1.1  mrg 		    }
1.1  mrg 		}
1.1  mrg 	    }
1.1  mrg 	}
1.1  mrg       mpz_init (minm);
1.1  mrg       mpz_init (maxm);
1.1  mrg       if (rtype != VR_RANGE)
1.1  mrg 	{
1.1  mrg 	  mpz_set (minm, min);
1.1  mrg 	  mpz_set (maxm, max);
1.1  mrg 	}
1.1  mrg       else
1.1  mrg 	{
1.1  mrg 	  gcc_assert (wi::le_p (minv, maxv, sgn));
1.1  mrg 	  wi::to_mpz (minv, minm, sgn);
1.1  mrg 	  wi::to_mpz (maxv, maxm, sgn);
1.1  mrg 	}
1.1  mrg       /* Now walk the dominators of the loop header and use the entry
1.1  mrg 	 guards to refine the estimates.  Only a block entered through
1.1  mrg 	 a single true/false edge contributes a guard, and only such
1.1  mrg 	 blocks count against MAX_DOMINATORS_TO_WALK; the comparison is
1.1  mrg 	 inverted when the block is reached through the false edge.  */
1.1  mrg       for (bb = loop->header;
1.1  mrg 	   bb != ENTRY_BLOCK_PTR_FOR_FN (cfun) && cnt < MAX_DOMINATORS_TO_WALK;
1.1  mrg 	   bb = get_immediate_dominator (CDI_DOMINATORS, bb))
1.1  mrg 	{
1.1  mrg 	  edge e;
1.1  mrg 	  tree c0, c1;
1.1  mrg 	  gimple *cond;
1.1  mrg 	  enum tree_code cmp;
1.1  mrg
1.1  mrg 	  if (!single_pred_p (bb))
1.1  mrg 	    continue;
1.1  mrg 	  e = single_pred_edge (bb);
1.1  mrg
1.1  mrg 	  if (!(e->flags & (EDGE_TRUE_VALUE | EDGE_FALSE_VALUE)))
1.1  mrg 	    continue;
1.1  mrg
1.1  mrg 	  cond = last_stmt (e->src);
1.1  mrg 	  c0 = gimple_cond_lhs (cond);
1.1  mrg 	  cmp = gimple_cond_code (cond);
1.1  mrg 	  c1 = gimple_cond_rhs (cond);
1.1  mrg
1.1  mrg 	  if (e->flags & EDGE_FALSE_VALUE)
1.1  mrg 	    cmp = invert_tree_comparison (cmp, false);
1.1  mrg
1.1  mrg 	  refine_value_range_using_guard (type, var, c0, cmp, c1, minm, maxm);
1.1  mrg 	  ++cnt;
1.1  mrg 	}
1.1  mrg
1.1  mrg       mpz_add (minm, minm, off);
1.1  mrg       mpz_add (maxm, maxm, off);
1.1  mrg       /* If the computation may not wrap or off is zero, then this
1.1  mrg 	 is always fine.  If off is negative and minv + off isn't
1.1  mrg 	 smaller than type's minimum, or off is positive and
1.1  mrg 	 maxv + off isn't bigger than type's maximum, use the more
1.1  mrg 	 precise range too.  */
1.1  mrg       if (nowrap_type_p (type)
1.1  mrg 	  || mpz_sgn (off) == 0
1.1  mrg 	  || (mpz_sgn (off) < 0 && mpz_cmp (minm, min) >= 0)
1.1  mrg 	  || (mpz_sgn (off) > 0 && mpz_cmp (maxm, max) <= 0))
1.1  mrg 	{
1.1  mrg 	  mpz_set (min, minm);
1.1  mrg 	  mpz_set (max, maxm);
1.1  mrg 	  mpz_clear (minm);
1.1  mrg 	  mpz_clear (maxm);
1.1  mrg 	  return;
1.1  mrg 	}
1.1  mrg       mpz_clear (minm);
1.1  mrg       mpz_clear (maxm);
1.1  mrg     }
1.1  mrg
1.1  mrg   /* If the computation may wrap, we know nothing about the value, except for
1.1  mrg      the range of the type.  */
1.1  mrg   if (!nowrap_type_p (type))
1.1  mrg     return;
1.1  mrg
1.1  mrg   /* Since the addition of OFF does not wrap, if OFF is positive, then we may
1.1  mrg      add it to MIN, otherwise to MAX.  */
1.1  mrg   if (mpz_sgn (off) < 0)
1.1  mrg     mpz_add (max, max, off);
1.1  mrg   else
1.1  mrg     mpz_add (min, min, off);
1.1  mrg }
1.1  mrg
1.1  mrg /* Computes bounds on (var + X) - (var + Y), where both sums are evaluated
1.1  mrg    in TYPE, and stores them to BNDS.  BNDS->below and BNDS->up are only
1.1  mrg    assigned, so they must already be initialized.  */
1.1  mrg
1.1  mrg static void
1.1  mrg bound_difference_of_offsetted_base (tree type, mpz_t x, mpz_t y,
1.1  mrg 				    bounds *bnds)
1.1  mrg {
1.1  mrg   const int order = mpz_cmp (x, y);
1.1  mrg   const bool wraps = !nowrap_type_p (type);
1.1  mrg
1.1  mrg   /* Equal offsets give equal expressions, whether or not they wrap.  */
1.1  mrg   if (order == 0)
1.1  mrg     {
1.1  mrg       mpz_set_ui (bnds->below, 0);
1.1  mrg       mpz_set_ui (bnds->up, 0);
1.1  mrg       return;
1.1  mrg     }
1.1  mrg
1.1  mrg   /* When neither sum wraps, or both do, the difference is exactly
1.1  mrg      X - Y.  */
1.1  mrg   mpz_sub (bnds->up, x, y);
1.1  mrg   mpz_set (bnds->below, bnds->up);
1.1  mrg
1.1  mrg   /* M is the number of values of TYPE, i.e. 2^precision.  */
1.1  mrg   mpz_t modulus;
1.1  mrg   mpz_init (modulus);
1.1  mrg   wi::to_mpz (wi::minus_one (TYPE_PRECISION (type)), modulus, UNSIGNED);
1.1  mrg   mpz_add_ui (modulus, modulus, 1);
1.1  mrg
1.1  mrg   /* If TYPE may wrap, exactly one of the sums can wrap around:
1.1  mrg
1.1  mrg      -- with X > Y, either var + X overflows or var + Y underflows, and
1.1  mrg 	in both cases the difference becomes X - Y - M, so the bounds
1.1  mrg 	are (X - Y - M, X - Y);
1.1  mrg      -- with X < Y, symmetrically, the difference may become X - Y + M,
1.1  mrg 	so the bounds are (X - Y, X - Y + M).  */
1.1  mrg   if (wraps && order > 0)
1.1  mrg     mpz_sub (bnds->below, bnds->below, modulus);
1.1  mrg   else if (wraps)
1.1  mrg     mpz_add (bnds->up, bnds->up, modulus);
1.1  mrg
1.1  mrg   mpz_clear (modulus);
1.1  mrg }
1.1  mrg
1.1  mrg /* From condition C0 CMP C1 derives information regarding the
1.1  mrg    difference of values of VARX + OFFX and VARY + OFFY, computed in TYPE,
1.1  mrg    and stores it to BNDS.
1.1  mrg
1.1  mrg    BNDS is an in-out parameter that is only ever tightened: a guard can
1.1  mrg    lower BNDS->up or raise BNDS->below, never the opposite.  OFFX and
1.1  mrg    OFFY are not modified; local copies are used where the roles of X
1.1  mrg    and Y have to be exchanged.  The guard is used only if one of its
1.1  mrg    sides is based on VARX and the other on VARY.  */
1.1  mrg
1.1  mrg static void
1.1  mrg refine_bounds_using_guard (tree type, tree varx, mpz_t offx,
1.1  mrg 			   tree vary, mpz_t offy,
1.1  mrg 			   tree c0, enum tree_code cmp, tree c1,
1.1  mrg 			   bounds *bnds)
1.1  mrg {
1.1  mrg   tree varc0, varc1, ctype;
1.1  mrg   mpz_t offc0, offc1, loffx, loffy, bnd;
1.1  mrg   bool lbound = false;
1.1  mrg   bool no_wrap = nowrap_type_p (type);
1.1  mrg   bool x_ok, y_ok;
1.1  mrg
1.1  mrg   switch (cmp)
1.1  mrg     {
1.1  mrg     case LT_EXPR:
1.1  mrg     case LE_EXPR:
1.1  mrg     case GT_EXPR:
1.1  mrg     case GE_EXPR:
1.1  mrg       STRIP_SIGN_NOPS (c0);
1.1  mrg       STRIP_SIGN_NOPS (c1);
1.1  mrg       ctype = TREE_TYPE (c0);
1.1  mrg       if (!useless_type_conversion_p (ctype, type))
1.1  mrg 	return;
1.1  mrg
1.1  mrg       break;
1.1  mrg
1.1  mrg     case EQ_EXPR:
1.1  mrg       /* We could derive quite precise information from EQ_EXPR, however, such
1.1  mrg 	 a guard is unlikely to appear, so we do not bother with handling
1.1  mrg 	 it.  */
1.1  mrg       return;
1.1  mrg
1.1  mrg     case NE_EXPR:
1.1  mrg       /* NE_EXPR comparisons do not contain much of useful information, except for
1.1  mrg 	 special case of comparing with the bounds of the type.  */
1.1  mrg       if (TREE_CODE (c1) != INTEGER_CST
1.1  mrg 	  || !INTEGRAL_TYPE_P (type))
1.1  mrg 	return;
1.1  mrg
1.1  mrg       /* Ensure that the condition speaks about an expression in the same type
1.1  mrg 	 as X and Y.  */
1.1  mrg       ctype = TREE_TYPE (c0);
1.1  mrg       if (TYPE_PRECISION (ctype) != TYPE_PRECISION (type))
1.1  mrg 	return;
1.1  mrg       c0 = fold_convert (type, c0);
1.1  mrg       c1 = fold_convert (type, c1);
1.1  mrg
1.1  mrg       if (TYPE_MIN_VALUE (type)
1.1  mrg 	  && operand_equal_p (c1, TYPE_MIN_VALUE (type), 0))
1.1  mrg 	{
1.1  mrg 	  cmp = GT_EXPR;  /* Differing from the minimum means above it.  */
1.1  mrg 	  break;
1.1  mrg 	}
1.1  mrg       if (TYPE_MAX_VALUE (type)
1.1  mrg 	  && operand_equal_p (c1, TYPE_MAX_VALUE (type), 0))
1.1  mrg 	{
1.1  mrg 	  cmp = LT_EXPR;  /* Differing from the maximum means below it.  */
1.1  mrg 	  break;
1.1  mrg 	}
1.1  mrg
1.1  mrg       return;
1.1  mrg     default:
1.1  mrg       return;
1.1  mrg     }
1.1  mrg
1.1  mrg   mpz_init (offc0);
1.1  mrg   mpz_init (offc1);
1.1  mrg   split_to_var_and_offset (expand_simple_operations (c0), &varc0, offc0);
1.1  mrg   split_to_var_and_offset (expand_simple_operations (c1), &varc1, offc1);
1.1  mrg
1.1  mrg   /* We are only interested in comparisons of expressions based on VARX and
1.1  mrg      VARY.  TODO -- we might also be able to derive some bounds from
1.1  mrg      expressions containing just one of the variables.  If VARX appears
1.1  mrg      on the right-hand side, the guard is mirrored first so that it can
1.1  mrg      be matched as VARX-based cmp VARY-based.  */
1.1  mrg
1.1  mrg   if (operand_equal_p (varx, varc1, 0))
1.1  mrg     {
1.1  mrg       std::swap (varc0, varc1);
1.1  mrg       mpz_swap (offc0, offc1);
1.1  mrg       cmp = swap_tree_comparison (cmp);
1.1  mrg     }
1.1  mrg
1.1  mrg   if (!operand_equal_p (varx, varc0, 0)
1.1  mrg       || !operand_equal_p (vary, varc1, 0))
1.1  mrg     goto end;
1.1  mrg
1.1  mrg   mpz_init_set (loffx, offx);
1.1  mrg   mpz_init_set (loffy, offy);
1.1  mrg
1.1  mrg   if (cmp == GT_EXPR || cmp == GE_EXPR)
1.1  mrg     {
1.1  mrg       std::swap (varx, vary);
1.1  mrg       mpz_swap (offc0, offc1);
1.1  mrg       mpz_swap (loffx, loffy);
1.1  mrg       cmp = swap_tree_comparison (cmp);
1.1  mrg       lbound = true;  /* The bound derived below limits X - Y from below.  */
1.1  mrg     }
1.1  mrg
1.1  mrg   /* If there is no overflow, the condition implies that
1.1  mrg
1.1  mrg      (VARX + OFFX) cmp (VARY + OFFY) + (OFFX - OFFY + OFFC1 - OFFC0).
1.1  mrg
1.1  mrg      The overflows and underflows may complicate things a bit; each
1.1  mrg      overflow decreases the appropriate offset by M, and underflow
1.1  mrg      increases it by M.  The above inequality would not necessarily be
1.1  mrg      true if
1.1  mrg
1.1  mrg      -- VARX + OFFX underflows and VARX + OFFC0 does not, or
1.1  mrg 	VARX + OFFC0 overflows, but VARX + OFFX does not.
1.1  mrg 	This may only happen if OFFX < OFFC0.
1.1  mrg      -- VARY + OFFY overflows and VARY + OFFC1 does not, or
1.1  mrg 	VARY + OFFC1 underflows and VARY + OFFY does not.
1.1  mrg 	This may only happen if OFFY > OFFC1.  */
1.1  mrg
1.1  mrg   if (no_wrap)
1.1  mrg     {
1.1  mrg       x_ok = true;
1.1  mrg       y_ok = true;
1.1  mrg     }
1.1  mrg   else
1.1  mrg     {
1.1  mrg       x_ok = (integer_zerop (varx)
1.1  mrg 	      || mpz_cmp (loffx, offc0) >= 0);
1.1  mrg       y_ok = (integer_zerop (vary)
1.1  mrg 	      || mpz_cmp (loffy, offc1) <= 0);
1.1  mrg     }
1.1  mrg
1.1  mrg   if (x_ok && y_ok)
1.1  mrg     {
1.1  mrg       mpz_init (bnd);
1.1  mrg       mpz_sub (bnd, loffx, loffy);
1.1  mrg       mpz_add (bnd, bnd, offc1);
1.1  mrg       mpz_sub (bnd, bnd, offc0);
1.1  mrg
1.1  mrg       if (cmp == LT_EXPR)
1.1  mrg 	mpz_sub_ui (bnd, bnd, 1);  /* Strict comparison: one less.  */
1.1  mrg
1.1  mrg       if (lbound)
1.1  mrg 	{
1.1  mrg 	  mpz_neg (bnd, bnd);
1.1  mrg 	  if (mpz_cmp (bnds->below, bnd) < 0)
1.1  mrg 	    mpz_set (bnds->below, bnd);
1.1  mrg 	}
1.1  mrg       else
1.1  mrg 	{
1.1  mrg 	  if (mpz_cmp (bnd, bnds->up) < 0)
1.1  mrg 	    mpz_set (bnds->up, bnd);
1.1  mrg 	}
1.1  mrg       mpz_clear (bnd);
1.1  mrg     }
1.1  mrg
1.1  mrg   mpz_clear (loffx);
1.1  mrg   mpz_clear (loffy);
1.1  mrg end:
1.1  mrg   mpz_clear (offc0);
1.1  mrg   mpz_clear (offc1);
1.1  mrg }
1.1  mrg
1.1  mrg /* Stores the bounds on the value of the expression X - Y in LOOP to BNDS.
1.1  mrg    The subtraction is considered to be performed in arbitrary precision,
1.1  mrg    without overflows.
1.1  mrg
1.1  mrg    We do not attempt to be too clever regarding the value ranges of X and
1.1  mrg    Y; most of the time, they are just integers or ssa names offsetted by
1.1  mrg    integer.  However, we try to use the information contained in the
1.1  mrg    comparisons before the loop (usually created by loop header copying).
1.1  mrg
1.1  mrg    BNDS->below and BNDS->up are initialized here with mpz_init and are
1.1  mrg    not cleared by this function, so releasing them is left to the
1.1  mrg    caller.  The type used for the analysis is the type of X as passed
1.1  mrg    in, before sign-preserving no-op conversions are stripped.  */
1.1  mrg
1.1  mrg static void
1.1  mrg bound_difference (class loop *loop, tree x, tree y, bounds *bnds)
1.1  mrg {
1.1  mrg   tree type = TREE_TYPE (x);
1.1  mrg   tree varx, vary;
1.1  mrg   mpz_t offx, offy;
1.1  mrg   mpz_t minx, maxx, miny, maxy;
1.1  mrg   int cnt = 0;
1.1  mrg   edge e;
1.1  mrg   basic_block bb;
1.1  mrg   tree c0, c1;
1.1  mrg   gimple *cond;
1.1  mrg   enum tree_code cmp;
1.1  mrg
1.1  mrg   /* Get rid of unnecessary casts, but preserve the value of
1.1  mrg      the expressions.  */
1.1  mrg   STRIP_SIGN_NOPS (x);
1.1  mrg   STRIP_SIGN_NOPS (y);
1.1  mrg
1.1  mrg   mpz_init (bnds->below);
1.1  mrg   mpz_init (bnds->up);
1.1  mrg   mpz_init (offx);
1.1  mrg   mpz_init (offy);
1.1  mrg   split_to_var_and_offset (x, &varx, offx);
1.1  mrg   split_to_var_and_offset (y, &vary, offy);
1.1  mrg
1.1  mrg   if (!integer_zerop (varx)
1.1  mrg       && operand_equal_p (varx, vary, 0))
1.1  mrg     {
1.1  mrg       /* Special case VARX == VARY -- we just need to compare the
1.1  mrg          offsets.  The matters are a bit more complicated in the
1.1  mrg 	 case addition of offsets may wrap.  */
1.1  mrg       bound_difference_of_offsetted_base (type, offx, offy, bnds);
1.1  mrg     }
1.1  mrg   else
1.1  mrg     {
1.1  mrg       /* Otherwise, use the value ranges to determine the initial
1.1  mrg 	 estimates on below and up: the smallest difference is
1.1  mrg 	 min (X) - max (Y) and the largest is max (X) - min (Y).  */
1.1  mrg       mpz_init (minx);
1.1  mrg       mpz_init (maxx);
1.1  mrg       mpz_init (miny);
1.1  mrg       mpz_init (maxy);
1.1  mrg       determine_value_range (loop, type, varx, offx, minx, maxx);
1.1  mrg       determine_value_range (loop, type, vary, offy, miny, maxy);
1.1  mrg
1.1  mrg       mpz_sub (bnds->below, minx, maxy);
1.1  mrg       mpz_sub (bnds->up, maxx, miny);
1.1  mrg       mpz_clear (minx);
1.1  mrg       mpz_clear (maxx);
1.1  mrg       mpz_clear (miny);
1.1  mrg       mpz_clear (maxy);
1.1  mrg     }
1.1  mrg
1.1  mrg   /* If both X and Y are constants, we cannot get any more precise.  */
1.1  mrg   if (integer_zerop (varx) && integer_zerop (vary))
1.1  mrg     goto end;
1.1  mrg
1.1  mrg   /* Now walk the dominators of the loop header and use the entry
1.1  mrg      guards to refine the estimates.  Only a block entered through a
1.1  mrg      single true/false edge contributes a guard, and only such blocks
1.1  mrg      count against MAX_DOMINATORS_TO_WALK; the comparison is inverted
1.1  mrg      when the block is reached through the false edge.  */
1.1  mrg   for (bb = loop->header;
1.1  mrg        bb != ENTRY_BLOCK_PTR_FOR_FN (cfun) && cnt < MAX_DOMINATORS_TO_WALK;
1.1  mrg        bb = get_immediate_dominator (CDI_DOMINATORS, bb))
1.1  mrg     {
1.1  mrg       if (!single_pred_p (bb))
1.1  mrg 	continue;
1.1  mrg       e = single_pred_edge (bb);
1.1  mrg
1.1  mrg       if (!(e->flags & (EDGE_TRUE_VALUE | EDGE_FALSE_VALUE)))
1.1  mrg 	continue;
1.1  mrg
1.1  mrg       cond = last_stmt (e->src);
1.1  mrg       c0 = gimple_cond_lhs (cond);
1.1  mrg       cmp = gimple_cond_code (cond);
1.1  mrg       c1 = gimple_cond_rhs (cond);
1.1  mrg
1.1  mrg       if (e->flags & EDGE_FALSE_VALUE)
1.1  mrg 	cmp = invert_tree_comparison (cmp, false);
1.1  mrg
1.1  mrg       refine_bounds_using_guard (type, varx, offx, vary, offy,
1.1  mrg 				 c0, cmp, c1, bnds);
1.1  mrg       ++cnt;
1.1  mrg     }
1.1  mrg
1.1  mrg end:
1.1  mrg   mpz_clear (offx);
1.1  mrg   mpz_clear (offy);
1.1  mrg }
1.1  mrg
1.1  mrg /* Shifts the interval in BNDS, which restricts some value X, by DELTA so
1.1  mrg    that it restricts X + DELTA instead.  X is a difference of two values
1.1  mrg    of TYPE, so the shifted interval is clamped to [-LIMIT, LIMIT], where
1.1  mrg    LIMIT is the all-ones value of the precision of TYPE read as an
1.1  mrg    unsigned number.  */
1.1  mrg
1.1  mrg static void
1.1  mrg bounds_add (bounds *bnds, const widest_int &delta, tree type)
1.1  mrg {
1.1  mrg   mpz_t shift, limit;
1.1  mrg
1.1  mrg   mpz_init (shift);
1.1  mrg   mpz_init (limit);
1.1  mrg   wi::to_mpz (delta, shift, SIGNED);
1.1  mrg   wi::to_mpz (wi::minus_one (TYPE_PRECISION (type)), limit, UNSIGNED);
1.1  mrg
1.1  mrg   /* Move both ends of the interval.  */
1.1  mrg   mpz_add (bnds->up, bnds->up, shift);
1.1  mrg   mpz_add (bnds->below, bnds->below, shift);
1.1  mrg
1.1  mrg   /* Clamp the upper end at LIMIT...  */
1.1  mrg   if (mpz_cmp (bnds->up, limit) > 0)
1.1  mrg     mpz_set (bnds->up, limit);
1.1  mrg
1.1  mrg   /* ... and the lower end at -LIMIT.  */
1.1  mrg   mpz_neg (limit, limit);
1.1  mrg   if (mpz_cmp (bnds->below, limit) < 0)
1.1  mrg     mpz_set (bnds->below, limit);
1.1  mrg
1.1  mrg   mpz_clear (limit);
1.1  mrg   mpz_clear (shift);
1.1  mrg }
1.1  mrg
1.1  mrg /* Turns the interval in BNDS, which restricts some value X, into the
1.1  mrg    interval restricting -X: the new lower end is the negated old upper
1.1  mrg    end and vice versa.  */
1.1  mrg
1.1  mrg static void
1.1  mrg bounds_negate (bounds *bnds)
1.1  mrg {
1.1  mrg   /* Exchange the two ends first, then flip the sign of each.  */
1.1  mrg   mpz_swap (bnds->below, bnds->up);
1.1  mrg   mpz_neg (bnds->below, bnds->below);
1.1  mrg   mpz_neg (bnds->up, bnds->up);
1.1  mrg }
1.1  mrg
1.1  mrg /* Returns inverse of X modulo 2^s, where MASK = 2^s-1.  The result is
1.1  mrg    built in the type of X as X raised to the power 2^(s-1) - 1, computed
1.1  mrg    by repeated squaring and finally reduced with MASK.  When the type
1.1  mrg    fits in a HOST_WIDE_INT, X and MASK must be constants that fit in one
1.1  mrg    as well (this is asserted).  */
1.1  mrg
1.1  mrg static tree
1.1  mrg inverse (tree x, tree mask)
1.1  mrg {
1.1  mrg   tree type = TREE_TYPE (x);
1.1  mrg   /* For MASK = 2^s-1 this is s - 1.  */
1.1  mrg   unsigned squarings = tree_floor_log2 (mask);
1.1  mrg
1.1  mrg   if (TYPE_PRECISION (type) > HOST_BITS_PER_WIDE_INT)
1.1  mrg     {
1.1  mrg       /* Too wide for a host integer: fold the arithmetic on trees.  */
1.1  mrg       tree product = build_int_cst (type, 1);
1.1  mrg       tree power = x;
1.1  mrg
1.1  mrg       while (squarings != 0)
1.1  mrg 	{
1.1  mrg 	  product = int_const_binop (MULT_EXPR, product, power);
1.1  mrg 	  power = int_const_binop (MULT_EXPR, power, power);
1.1  mrg 	  squarings--;
1.1  mrg 	}
1.1  mrg
1.1  mrg       return int_const_binop (BIT_AND_EXPR, product, mask);
1.1  mrg     }
1.1  mrg
1.1  mrg   gcc_assert (cst_and_fits_in_hwi (x));
1.1  mrg   gcc_assert (cst_and_fits_in_hwi (mask));
1.1  mrg
1.1  mrg   unsigned HOST_WIDE_INT power = int_cst_value (x);
1.1  mrg   unsigned HOST_WIDE_INT low_bits = int_cst_value (mask);
1.1  mrg   unsigned HOST_WIDE_INT product = 1;
1.1  mrg
1.1  mrg   /* The multiplications are done in unsigned host arithmetic; only the
1.1  mrg      bits selected by MASK are kept at the end.  */
1.1  mrg   while (squarings != 0)
1.1  mrg     {
1.1  mrg       product *= power;
1.1  mrg       power *= power;
1.1  mrg       squarings--;
1.1  mrg     }
1.1  mrg   product &= low_bits;
1.1  mrg
1.1  mrg   return build_int_cst_type (type, product);
1.1  mrg }
1.1  mrg
1.1  mrg /* Stores to BND an upper bound on the number of executions of a loop whose
1.1  mrg    exit condition is S * i <> C.  NO_OVERFLOW tells that the control
1.1  mrg    variable of the loop does not overflow.  EXIT_MUST_BE_TAKEN tells that
1.1  mrg    the loop is guaranteed to end through this exit, i.e., that the induction
1.1  mrg    variable eventually reaches the value of C.
1.1  mrg
1.1  mrg    C stands for final - base, with final and base being the final and the
1.1  mrg    initial value of the actual induction variable of the analysed loop.
1.1  mrg    BNDS bounds this difference as computed in a signed type of unbounded
1.1  mrg    range, whereas C itself is computed in an unsigned type whose range
1.1  mrg    matches the type of the induction variable.  Hence BNDS.up is an upper
1.1  mrg    bound on C in these cases:
1.1  mrg    -- the iv must reach its final value without overflow, i.e.,
1.1  mrg       NO_OVERFLOW && EXIT_MUST_BE_TAKEN holds, or
1.1  mrg    -- final >= base, which is known to hold when BNDS.below >= 0.  */
1.1  mrg
1.1  mrg static void
1.1  mrg number_of_iterations_ne_max (mpz_t bnd, bool no_overflow, tree c, tree s,
1.1  mrg 			     bounds *bnds, bool exit_must_be_taken)
1.1  mrg {
1.1  mrg   tree type = TREE_TYPE (c);
1.1  mrg
1.1  mrg   /* This has to be sampled from the flags as passed in, before they are
1.1  mrg      possibly strengthened below: the real induction variable (running from
1.1  mrg      base to final rather than from 0 to C) may still overflow, and then
1.1  mrg      BNDS.up is not a correct upper bound on C.  */
1.1  mrg   bool bnds_u_valid = (mpz_sgn (bnds->below) >= 0
1.1  mrg 		       || (no_overflow && exit_must_be_taken));
1.1  mrg
1.1  mrg   /* When C is an exact multiple of S, the value C is reached before the
1.1  mrg      induction variable overflows (unless the loop is left some other way
1.1  mrg      first).  */
1.1  mrg   bool c_multiple_of_s
1.1  mrg     = (integer_onep (s)
1.1  mrg        || (TREE_CODE (c) == INTEGER_CST
1.1  mrg 	   && TREE_CODE (s) == INTEGER_CST
1.1  mrg 	   && wi::mod_trunc (wi::to_wide (c), wi::to_wide (s),
1.1  mrg 			     TYPE_SIGN (type)) == 0)
1.1  mrg        || (TYPE_OVERFLOW_UNDEFINED (type)
1.1  mrg 	   && multiple_of_p (type, c, s)));
1.1  mrg   if (c_multiple_of_s)
1.1  mrg     {
1.1  mrg       no_overflow = true;
1.1  mrg       exit_must_be_taken = true;
1.1  mrg     }
1.1  mrg
1.1  mrg   /* An induction variable that may overflow iterates at most for the period
1.1  mrg      of the control variable (or forever, but in that case the whole # of
1.1  mrg      iterations analysis fails).  */
1.1  mrg   if (!no_overflow)
1.1  mrg     {
1.1  mrg       widest_int period
1.1  mrg 	= wi::mask <widest_int> (TYPE_PRECISION (type)
1.1  mrg 				 - wi::ctz (wi::to_wide (s)), false);
1.1  mrg       wi::to_mpz (period, bnd, UNSIGNED);
1.1  mrg       return;
1.1  mrg     }
1.1  mrg
1.1  mrg   /* Without overflow the loop iterates at most (range of type / S) times.
1.1  mrg      If in addition the induction variable is guaranteed to reach C, the
1.1  mrg      dividend can be tightened to C itself, or to the bound BNDS gives for
1.1  mrg      it when that bound is valid.  */
1.1  mrg   if (exit_must_be_taken && TREE_CODE (c) == INTEGER_CST)
1.1  mrg     wi::to_mpz (wi::to_wide (c), bnd, UNSIGNED);
1.1  mrg   else if (exit_must_be_taken && bnds_u_valid)
1.1  mrg     mpz_set (bnd, bnds->up);
1.1  mrg   else
1.1  mrg     wi::to_mpz (wi::minus_one (TYPE_PRECISION (type)), bnd, UNSIGNED);
1.1  mrg
1.1  mrg   mpz_t divisor;
1.1  mrg   mpz_init (divisor);
1.1  mrg   wi::to_mpz (wi::to_wide (s), divisor, UNSIGNED);
1.1  mrg   mpz_fdiv_q (bnd, bnd, divisor);
1.1  mrg   mpz_clear (divisor);
1.1  mrg }
1.1  mrg
1.1  mrg /* Determines number of iterations of loop whose ending condition
1.1  mrg    is IV <> FINAL.  TYPE is the type of the iv.  The number of
1.1  mrg    iterations is stored to NITER.  EXIT_MUST_BE_TAKEN is true if
1.1  mrg    we know that the exit must be taken eventually, i.e., that the IV
1.1  mrg    ever reaches the value FINAL (we derived this earlier, and possibly set
1.1  mrg    NITER->assumptions to make sure this is the case).  BNDS contains the
1.1  mrg    bounds on the difference FINAL - IV->base.
1.1  mrg
1.1  mrg    LOOP is only passed on to simplify_using_initial_conditions when trying
1.1  mrg    to prove that the control iv does not overflow.
1.1  mrg
1.1  mrg    On return NITER->control, NITER->bound, NITER->cmp, NITER->max and
1.1  mrg    NITER->niter are set; NITER->control.no_overflow may be upgraded to true
1.1  mrg    and NITER->assumptions may be extended with a divisibility condition.
1.1  mrg    BNDS is negated in place when the step of IV is negative.  Every return
1.1  mrg    path of this function returns true.  */
1.1  mrg
1.1  mrg static bool
1.1  mrg number_of_iterations_ne (class loop *loop, tree type, affine_iv *iv,
1.1  mrg 			 tree final, class tree_niter_desc *niter,
1.1  mrg 			 bool exit_must_be_taken, bounds *bnds)
1.1  mrg {
1.1  mrg   tree niter_type = unsigned_type_for (type);
1.1  mrg   tree s, c, d, bits, assumption, tmp, bound;
1.1  mrg   mpz_t max;
1.1  mrg
1.1  mrg   niter->control = *iv;
1.1  mrg   niter->bound = final;
1.1  mrg   niter->cmp = NE_EXPR;
1.1  mrg
1.1  mrg   /* Rearrange the terms so that we get inequality S * i <> C, with S
1.1  mrg      positive.  Also cast everything to the unsigned type.  If IV does
1.1  mrg      not overflow, BNDS bounds the value of C.  Also, this is the
1.1  mrg      case if the computation |FINAL - IV->base| does not overflow, i.e.,
1.1  mrg      if BNDS->below in the result is nonnegative.  For a negative step,
1.1  mrg      C is IV->base - FINAL, so BNDS is negated to keep bounding C.  */
1.1  mrg   if (tree_int_cst_sign_bit (iv->step))
1.1  mrg     {
1.1  mrg       s = fold_convert (niter_type,
1.1  mrg 			fold_build1 (NEGATE_EXPR, type, iv->step));
1.1  mrg       c = fold_build2 (MINUS_EXPR, niter_type,
1.1  mrg 		       fold_convert (niter_type, iv->base),
1.1  mrg 		       fold_convert (niter_type, final));
1.1  mrg       bounds_negate (bnds);
1.1  mrg     }
1.1  mrg   else
1.1  mrg     {
1.1  mrg       s = fold_convert (niter_type, iv->step);
1.1  mrg       c = fold_build2 (MINUS_EXPR, niter_type,
1.1  mrg 		       fold_convert (niter_type, final),
1.1  mrg 		       fold_convert (niter_type, iv->base));
1.1  mrg     }
1.1  mrg
1.1  mrg   mpz_init (max);
1.1  mrg   number_of_iterations_ne_max (max, iv->no_overflow, c, s, bnds,
1.1  mrg 			       exit_must_be_taken);
1.1  mrg   niter->max = widest_int::from (wi::from_mpz (niter_type, max, false),
1.1  mrg 				 TYPE_SIGN (niter_type));
1.1  mrg   mpz_clear (max);
1.1  mrg
1.1  mrg   /* Compute no-overflow information for the control iv.  This can be
1.1  mrg      proven when the two conditions below are satisfied:
1.1  mrg
1.1  mrg        1) IV evaluates toward FINAL at beginning, i.e:
1.1  mrg 	    base <= FINAL ; step > 0
1.1  mrg 	    base >= FINAL ; step < 0
1.1  mrg
1.1  mrg        2) |FINAL - base| is an exact multiple of step.
1.1  mrg
1.1  mrg      Unfortunately, it's hard to prove above conditions after pass loop-ch
1.1  mrg      because loop with exit condition (IV != FINAL) usually will be guarded
1.1  mrg      by initial-condition (IV.base - IV.step != FINAL).  In this case, we
1.1  mrg      can alternatively try to prove below conditions:
1.1  mrg
1.1  mrg        1') IV evaluates toward FINAL at beginning, i.e:
1.1  mrg 	    new_base = base - step < FINAL ; step > 0
1.1  mrg 					     && base - step doesn't underflow
1.1  mrg 	    new_base = base - step > FINAL ; step < 0
1.1  mrg 					     && base - step doesn't overflow
1.1  mrg
1.1  mrg      Please refer to PR34114 as an example of loop-ch's impact.
1.1  mrg
1.1  mrg      Note, for NE_EXPR, base equals to FINAL is a special case, in
1.1  mrg      which the loop exits immediately, and the iv does not overflow.
1.1  mrg
1.1  mrg      Also note, we prove condition 2) by checking base and final separately
1.1  mrg      along with condition 1) or 1').  Since we ensure the difference
1.1  mrg      computation of c does not wrap with cond below and the adjusted s
1.1  mrg      will fit a signed type as well as an unsigned we can safely do
1.1  mrg      this using the type of the IV if it is not pointer typed.  */
1.1  mrg   tree mtype = type;
1.1  mrg   if (POINTER_TYPE_P (type))
1.1  mrg     mtype = niter_type;
1.1  mrg   if (!niter->control.no_overflow
1.1  mrg       && (integer_onep (s)
1.1  mrg 	  || (multiple_of_p (mtype, fold_convert (mtype, iv->base),
1.1  mrg 			     fold_convert (mtype, s), false)
1.1  mrg 	      && multiple_of_p (mtype, fold_convert (mtype, final),
1.1  mrg 				fold_convert (mtype, s), false))))
1.1  mrg     {
1.1  mrg       tree t, cond, relaxed_cond = boolean_false_node;
1.1  mrg
1.1  mrg       if (tree_int_cst_sign_bit (iv->step))
1.1  mrg 	{
1.1  mrg 	  cond = fold_build2 (GE_EXPR, boolean_type_node, iv->base, final);
1.1  mrg 	  if (TREE_CODE (type) == INTEGER_TYPE)
1.1  mrg 	    {
1.1  mrg 	      /* Only when base - step doesn't overflow, i.e., when
1.1  mrg 		 MAX + step >= base folds to true (step is negative).  */
1.1  mrg 	      t = TYPE_MAX_VALUE (type);
1.1  mrg 	      t = fold_build2 (PLUS_EXPR, type, t, iv->step);
1.1  mrg 	      t = fold_build2 (GE_EXPR, boolean_type_node, t, iv->base);
1.1  mrg 	      if (integer_nonzerop (t))
1.1  mrg 		{
1.1  mrg 		  t = fold_build2 (MINUS_EXPR, type, iv->base, iv->step);
1.1  mrg 		  relaxed_cond = fold_build2 (GT_EXPR, boolean_type_node, t,
1.1  mrg 					      final);
1.1  mrg 		}
1.1  mrg 	    }
1.1  mrg 	}
1.1  mrg       else
1.1  mrg 	{
1.1  mrg 	  cond = fold_build2 (LE_EXPR, boolean_type_node, iv->base, final);
1.1  mrg 	  if (TREE_CODE (type) == INTEGER_TYPE)
1.1  mrg 	    {
1.1  mrg 	      /* Only when base - step doesn't underflow, i.e., when
1.1  mrg 		 MIN + step <= base folds to true.  */
1.1  mrg 	      t = TYPE_MIN_VALUE (type);
1.1  mrg 	      t = fold_build2 (PLUS_EXPR, type, t, iv->step);
1.1  mrg 	      t = fold_build2 (LE_EXPR, boolean_type_node, t, iv->base);
1.1  mrg 	      if (integer_nonzerop (t))
1.1  mrg 		{
1.1  mrg 		  t = fold_build2 (MINUS_EXPR, type, iv->base, iv->step);
1.1  mrg 		  relaxed_cond = fold_build2 (LT_EXPR, boolean_type_node, t,
1.1  mrg 					      final);
1.1  mrg 		}
1.1  mrg 	    }
1.1  mrg 	}
1.1  mrg
1.1  mrg       t = simplify_using_initial_conditions (loop, cond);
1.1  mrg       if (!t || !integer_onep (t))
1.1  mrg 	t = simplify_using_initial_conditions (loop, relaxed_cond);
1.1  mrg
1.1  mrg       if (t && integer_onep (t))
1.1  mrg 	{
1.1  mrg 	  niter->control.no_overflow = true;
1.1  mrg 	  niter->niter = fold_build2 (EXACT_DIV_EXPR, niter_type, c, s);
1.1  mrg 	  return true;
1.1  mrg 	}
1.1  mrg     }
1.1  mrg
1.1  mrg   /* Let d = gcd (step, size of mode); it is built below as 1 << BITS with
1.1  mrg      BITS = num_ending_zeros (S), and S is then replaced by S / d.  If d
1.1  mrg      does not divide c, the loop is infinite.  Otherwise, the number of
1.1  mrg      iterations is (inverse(s/d) * (c/d)) mod (size of mode/d).  BOUND is
1.1  mrg      the mask (size of mode/d) - 1 used for that final reduction.  */
1.1  mrg   bits = num_ending_zeros (s);
1.1  mrg   bound = build_low_bits_mask (niter_type,
1.1  mrg 			       (TYPE_PRECISION (niter_type)
1.1  mrg 				- tree_to_uhwi (bits)));
1.1  mrg
1.1  mrg   d = fold_binary_to_constant (LSHIFT_EXPR, niter_type,
1.1  mrg 			       build_int_cst (niter_type, 1), bits);
1.1  mrg   s = fold_binary_to_constant (RSHIFT_EXPR, niter_type, s, bits);
1.1  mrg
1.1  mrg   if (!exit_must_be_taken)
1.1  mrg     {
1.1  mrg       /* If we cannot assume that the exit is taken eventually, record the
1.1  mrg 	 assumptions for divisibility of c.  Nothing is recorded when the
1.1  mrg 	 condition already folds to a nonzero constant.  */
1.1  mrg       assumption = fold_build2 (FLOOR_MOD_EXPR, niter_type, c, d);
1.1  mrg       assumption = fold_build2 (EQ_EXPR, boolean_type_node,
1.1  mrg 				assumption, build_int_cst (niter_type, 0));
1.1  mrg       if (!integer_nonzerop (assumption))
1.1  mrg 	niter->assumptions = fold_build2 (TRUTH_AND_EXPR, boolean_type_node,
1.1  mrg 					  niter->assumptions, assumption);
1.1  mrg     }
1.1  mrg
1.1  mrg   c = fold_build2 (EXACT_DIV_EXPR, niter_type, c, d);
1.1  mrg   if (integer_onep (s))
1.1  mrg     {
1.1  mrg       niter->niter = c;
1.1  mrg     }
1.1  mrg   else
1.1  mrg     {
1.1  mrg       tmp = fold_build2 (MULT_EXPR, niter_type, c, inverse (s, bound));
1.1  mrg       niter->niter = fold_build2 (BIT_AND_EXPR, niter_type, tmp, bound);
1.1  mrg     }
1.1  mrg   return true;
1.1  mrg }
1.1  mrg
1.1  mrg /* Tries to determine the final value of the control variable of the loop
1.1  mrg    with ending condition IV0 < IV1 (computed in TYPE), so that the condition
1.1  mrg    can be treated as a != comparison.  DELTA is the difference
1.1  mrg    IV1->base - IV0->base and STEP is the absolute value of the step.
1.1  mrg
1.1  mrg    The assumptions needed to ensure that the computation of the final value
1.1  mrg    does not overflow are recorded in NITER, together with the condition
1.1  mrg    under which the loop does not roll at all.  When the final value is
1.1  mrg    found, DELTA is adjusted and true is returned; otherwise false is
1.1  mrg    returned and NITER, DELTA and BNDS are left untouched.  BNDS bounds the
1.1  mrg    value of IV1->base - IV0->base and is updated by the same amount as
1.1  mrg    DELTA.  EXIT_MUST_BE_TAKEN is true if we know that the exit must be taken
1.1  mrg    eventually.  */
1.1  mrg
1.1  mrg static bool
1.1  mrg number_of_iterations_lt_to_ne (tree type, affine_iv *iv0, affine_iv *iv1,
1.1  mrg 			       class tree_niter_desc *niter,
1.1  mrg 			       tree *delta, tree step,
1.1  mrg 			       bool exit_must_be_taken, bounds *bnds)
1.1  mrg {
1.1  mrg   tree niter_type = TREE_TYPE (step);
1.1  mrg   tree type1 = POINTER_TYPE_P (type) ? sizetype : type;
1.1  mrg   bool iv0_moves = integer_nonzerop (iv0->step);
1.1  mrg
1.1  mrg   /* MOD is the amount by which DELTA has to grow to become a multiple of
1.1  mrg      STEP.  Nothing can be done unless it is a constant.  */
1.1  mrg   tree mod = fold_build2 (FLOOR_MOD_EXPR, niter_type, *delta, step);
1.1  mrg   if (TREE_CODE (mod) != INTEGER_CST)
1.1  mrg     return false;
1.1  mrg   if (integer_nonzerop (mod))
1.1  mrg     mod = fold_build2 (MINUS_EXPR, niter_type, step, mod);
1.1  mrg   tree tmod = fold_convert (type1, mod);
1.1  mrg
1.1  mrg   /* The computation of the final value cannot overflow if the new final
1.1  mrg      value equals the current one, or if the induction variable does not
1.1  mrg      overflow and the exit is taken.  The same is postulated for pointer
1.1  mrg      typed variables: code cannot rely on the pointed-to object being placed
1.1  mrg      at the end of the address space (and, more pragmatically,
1.1  mrg      TYPE_{MIN,MAX}_VALUE is not defined for pointers).  */
1.1  mrg   bool fv_comp_no_overflow;
1.1  mrg   if (integer_zerop (mod) || POINTER_TYPE_P (type))
1.1  mrg     fv_comp_no_overflow = true;
1.1  mrg   else if (exit_must_be_taken)
1.1  mrg     fv_comp_no_overflow
1.1  mrg       = ((iv0->no_overflow && iv0_moves)
1.1  mrg 	 || (iv1->no_overflow && integer_nonzerop (iv1->step)));
1.1  mrg   else
1.1  mrg     fv_comp_no_overflow = false;
1.1  mrg
1.1  mrg   tree assumption = boolean_true_node;
1.1  mrg   if (!fv_comp_no_overflow)
1.1  mrg     {
1.1  mrg       tree limit;
1.1  mrg
1.1  mrg       if (iv0_moves)
1.1  mrg 	{
1.1  mrg 	  /* The final value of the iv is iv1->base + MOD, which must not
1.1  mrg 	     overflow: iv1->base <= MAX - MOD.  */
1.1  mrg 	  limit = fold_build2 (MINUS_EXPR, type1,
1.1  mrg 			       TYPE_MAX_VALUE (type1), tmod);
1.1  mrg 	  assumption = fold_build2 (LE_EXPR, boolean_type_node,
1.1  mrg 				    iv1->base, limit);
1.1  mrg 	}
1.1  mrg       else
1.1  mrg 	{
1.1  mrg 	  /* The final value of the iv is iv0->base - MOD, which must not
1.1  mrg 	     overflow: iv0->base >= MIN + MOD.  */
1.1  mrg 	  limit = fold_build2 (PLUS_EXPR, type1,
1.1  mrg 			       TYPE_MIN_VALUE (type1), tmod);
1.1  mrg 	  assumption = fold_build2 (GE_EXPR, boolean_type_node,
1.1  mrg 				    iv0->base, limit);
1.1  mrg 	}
1.1  mrg
1.1  mrg       /* The assumption is known to be false; give up.  */
1.1  mrg       if (integer_zerop (assumption))
1.1  mrg 	return false;
1.1  mrg     }
1.1  mrg
1.1  mrg   /* IV0 < IV1 does not loop if IV0->base >= IV1->base.  That condition is
1.1  mrg      dropped when -MOD is below the lower bound of the difference.  */
1.1  mrg   mpz_t neg_mod;
1.1  mrg   mpz_init (neg_mod);
1.1  mrg   wi::to_mpz (wi::to_wide (mod), neg_mod, UNSIGNED);
1.1  mrg   mpz_neg (neg_mod, neg_mod);
1.1  mrg   bool neg_mod_below_bnds = mpz_cmp (neg_mod, bnds->below) < 0;
1.1  mrg   mpz_clear (neg_mod);
1.1  mrg
1.1  mrg   tree noloop;
1.1  mrg   if (neg_mod_below_bnds)
1.1  mrg     noloop = boolean_false_node;
1.1  mrg   else
1.1  mrg     noloop = fold_build2 (GE_EXPR, boolean_type_node,
1.1  mrg 			  iv0->base, iv1->base);
1.1  mrg
1.1  mrg   if (!integer_nonzerop (assumption))
1.1  mrg     niter->assumptions = fold_build2 (TRUTH_AND_EXPR, boolean_type_node,
1.1  mrg 				      niter->assumptions,
1.1  mrg 				      assumption);
1.1  mrg   if (!integer_zerop (noloop))
1.1  mrg     niter->may_be_zero = fold_build2 (TRUTH_OR_EXPR, boolean_type_node,
1.1  mrg 				      niter->may_be_zero,
1.1  mrg 				      noloop);
1.1  mrg
1.1  mrg   bounds_add (bnds, wi::to_widest (mod), type);
1.1  mrg   *delta = fold_build2 (PLUS_EXPR, niter_type, *delta, mod);
1.1  mrg   return true;
1.1  mrg }
1.1  mrg
1.1  mrg /* Adds to NITER the assertions ensuring that the control variable of the
1.1  mrg    loop with ending condition IV0 < IV1 does not overflow.  IV0 and IV1 are
1.1  mrg    of type TYPE and STEP is the absolute value of the step.  Returns false
1.1  mrg    if the overflow can be proved to happen and true otherwise; in the latter
1.1  mrg    case both IV0 and IV1 are marked as not overflowing, unless the moving iv
1.1  mrg    already was, in which case nothing is changed.  */
1.1  mrg
1.1  mrg static bool
1.1  mrg assert_no_overflow_lt (tree type, affine_iv *iv0, affine_iv *iv1,
1.1  mrg 		       class tree_niter_desc *niter, tree step)
1.1  mrg {
1.1  mrg   tree niter_type = TREE_TYPE (step);
1.1  mrg
1.1  mrg   /* Either
1.1  mrg        for (i = iv0->base; i < iv1->base; i += iv0->step)
1.1  mrg      or
1.1  mrg        for (i = iv1->base; i > iv0->base; i += iv1->step).  */
1.1  mrg   bool counting_up = integer_nonzerop (iv0->step);
1.1  mrg   affine_iv *moving = counting_up ? iv0 : iv1;
1.1  mrg
1.1  mrg   if (moving->no_overflow)
1.1  mrg     return true;
1.1  mrg
1.1  mrg   /* With a constant base the last value before overflow can be determined
1.1  mrg      precisely; otherwise conservatively assume it is STEP - 1 away from
1.1  mrg      the extreme value of TYPE.  */
1.1  mrg   tree diff;
1.1  mrg   if (TREE_CODE (moving->base) == INTEGER_CST)
1.1  mrg     {
1.1  mrg       tree room;
1.1  mrg
1.1  mrg       if (counting_up)
1.1  mrg 	room = fold_build2 (MINUS_EXPR, niter_type,
1.1  mrg 			    fold_convert (niter_type, TYPE_MAX_VALUE (type)),
1.1  mrg 			    fold_convert (niter_type, iv0->base));
1.1  mrg       else
1.1  mrg 	room = fold_build2 (MINUS_EXPR, niter_type,
1.1  mrg 			    fold_convert (niter_type, iv1->base),
1.1  mrg 			    fold_convert (niter_type, TYPE_MIN_VALUE (type)));
1.1  mrg       diff = fold_build2 (FLOOR_MOD_EXPR, niter_type, room, step);
1.1  mrg     }
1.1  mrg   else
1.1  mrg     diff = fold_build2 (MINUS_EXPR, niter_type, step,
1.1  mrg 			build_int_cst (niter_type, 1));
1.1  mrg
1.1  mrg   /* The bound of the comparison has to stay on the safe side of that last
1.1  mrg      value.  */
1.1  mrg   tree assumption;
1.1  mrg   if (counting_up)
1.1  mrg     {
1.1  mrg       tree limit = fold_build2 (MINUS_EXPR, type,
1.1  mrg 				TYPE_MAX_VALUE (type),
1.1  mrg 				fold_convert (type, diff));
1.1  mrg       assumption = fold_build2 (LE_EXPR, boolean_type_node,
1.1  mrg 				iv1->base, limit);
1.1  mrg     }
1.1  mrg   else
1.1  mrg     {
1.1  mrg       tree limit = fold_build2 (PLUS_EXPR, type,
1.1  mrg 				TYPE_MIN_VALUE (type),
1.1  mrg 				fold_convert (type, diff));
1.1  mrg       assumption = fold_build2 (GE_EXPR, boolean_type_node,
1.1  mrg 				iv0->base, limit);
1.1  mrg     }
1.1  mrg
1.1  mrg   if (integer_zerop (assumption))
1.1  mrg     return false;
1.1  mrg
1.1  mrg   if (!integer_nonzerop (assumption))
1.1  mrg     niter->assumptions = fold_build2 (TRUTH_AND_EXPR, boolean_type_node,
1.1  mrg 				      niter->assumptions, assumption);
1.1  mrg
1.1  mrg   iv0->no_overflow = true;
1.1  mrg   iv1->no_overflow = true;
1.1  mrg   return true;
1.1  mrg }
1.1  mrg
1.1  mrg /* Add an assumption to NITER that a loop whose ending condition
1.1  mrg    is IV0 < IV1 rolls.  TYPE is the type of the control iv.  BNDS
1.1  mrg    bounds the value of IV1->base - IV0->base.
1.1  mrg
1.1  mrg    BNDS is only read here.  If BNDS alone shows that the loop rolls and that
1.1  mrg    the upper bound required by the iteration count formula holds, NITER is
1.1  mrg    left unchanged.  Otherwise NITER->assumptions may be extended with a
1.1  mrg    condition on the base of the moving iv (never for pointer types), and,
1.1  mrg    unless BNDS shows that the loop rolls, NITER->may_be_zero is extended
1.1  mrg    with the condition under which it does not.  */
1.1  mrg
1.1  mrg static void
1.1  mrg assert_loop_rolls_lt (tree type, affine_iv *iv0, affine_iv *iv1,
1.1  mrg 		      class tree_niter_desc *niter, bounds *bnds)
1.1  mrg {
1.1  mrg   tree assumption = boolean_true_node, bound, diff;
1.1  mrg   tree mbz, mbzl, mbzr, type1;
1.1  mrg   bool rolls_p, no_overflow_p;
1.1  mrg   widest_int dstep;
1.1  mrg   mpz_t mstep, max;
1.1  mrg
1.1  mrg   /* We are going to compute the number of iterations as
1.1  mrg      (iv1->base - iv0->base + step - 1) / step, computed in the unsigned
1.1  mrg      variant of TYPE.  This formula only works if
1.1  mrg
1.1  mrg      -step + 1 <= (iv1->base - iv0->base) <= MAX - step + 1
1.1  mrg
1.1  mrg      (where MAX is the maximum value of the unsigned variant of TYPE, and
1.1  mrg      the computations in this formula are performed in full precision,
1.1  mrg      i.e., without overflows).
1.1  mrg
1.1  mrg      Usually, for loops with exit condition iv0->base + step * i < iv1->base,
1.1  mrg      we have a condition of the form iv0->base - step < iv1->base before the loop,
1.1  mrg      and for loops iv0->base < iv1->base - step * i the condition
1.1  mrg      iv0->base < iv1->base + step, due to loop header copying, which enable us
1.1  mrg      to prove the lower bound.
1.1  mrg
1.1  mrg      The upper bound is more complicated.  Unless the expressions for initial
1.1  mrg      and final value themselves contain enough information, we usually cannot
1.1  mrg      derive it from the context.  */
1.1  mrg
1.1  mrg   /* First check whether the answer does not follow from the bounds we gathered
1.1  mrg      before.  DSTEP is the step as a positive number: iv0->step if that is
1.1  mrg      nonzero, otherwise the negation of the sign-extended iv1->step.  */
1.1  mrg   if (integer_nonzerop (iv0->step))
1.1  mrg     dstep = wi::to_widest (iv0->step);
1.1  mrg   else
1.1  mrg     {
1.1  mrg       dstep = wi::sext (wi::to_widest (iv1->step), TYPE_PRECISION (type));
1.1  mrg       dstep = -dstep;
1.1  mrg     }
1.1  mrg
1.1  mrg   mpz_init (mstep);
1.1  mrg   wi::to_mpz (dstep, mstep, UNSIGNED);
1.1  mrg   mpz_neg (mstep, mstep);
1.1  mrg   mpz_add_ui (mstep, mstep, 1);
1.1  mrg
1.1  mrg   rolls_p = mpz_cmp (mstep, bnds->below) <= 0;
1.1  mrg
1.1  mrg   mpz_init (max);
1.1  mrg   wi::to_mpz (wi::minus_one (TYPE_PRECISION (type)), max, UNSIGNED);
1.1  mrg   mpz_add (max, max, mstep);
1.1  mrg   no_overflow_p = (mpz_cmp (bnds->up, max) <= 0
1.1  mrg 		   /* For pointers, only values lying inside a single object
1.1  mrg 		      can be compared or manipulated by pointer arithmetics.
1.1  mrg 		      Gcc in general does not allow or handle objects larger
1.1  mrg 		      than half of the address space, hence the upper bound
1.1  mrg 		      is satisfied for pointers.  */
1.1  mrg 		   || POINTER_TYPE_P (type));
1.1  mrg   mpz_clear (mstep);
1.1  mrg   mpz_clear (max);
1.1  mrg
1.1  mrg   if (rolls_p && no_overflow_p)
1.1  mrg     return;
1.1  mrg
1.1  mrg   type1 = type;
1.1  mrg   if (POINTER_TYPE_P (type))
1.1  mrg     type1 = sizetype;
1.1  mrg
1.1  mrg   /* Now the hard part; we must formulate the assumption(s) as expressions, and
1.1  mrg      we must be careful not to introduce overflow.  MBZL and MBZR are the two
1.1  mrg      sides of the "does not roll" comparison MBZL > MBZR built at the end.  */
1.1  mrg
1.1  mrg   if (integer_nonzerop (iv0->step))
1.1  mrg     {
1.1  mrg       diff = fold_build2 (MINUS_EXPR, type1,
1.1  mrg 			  iv0->step, build_int_cst (type1, 1));
1.1  mrg
1.1  mrg       /* We need to know that iv0->base >= MIN + iv0->step - 1.  Since
1.1  mrg 	 0 address never belongs to any object, we can assume this for
1.1  mrg 	 pointers.  */
1.1  mrg       if (!POINTER_TYPE_P (type))
1.1  mrg 	{
1.1  mrg 	  bound = fold_build2 (PLUS_EXPR, type1,
1.1  mrg 			       TYPE_MIN_VALUE (type), diff);
1.1  mrg 	  assumption = fold_build2 (GE_EXPR, boolean_type_node,
1.1  mrg 				    iv0->base, bound);
1.1  mrg 	}
1.1  mrg
1.1  mrg       /* And then we can compute iv0->base - diff, and compare it with
1.1  mrg 	 iv1->base.  */
1.1  mrg       mbzl = fold_build2 (MINUS_EXPR, type1,
1.1  mrg 			  fold_convert (type1, iv0->base), diff);
1.1  mrg       mbzr = fold_convert (type1, iv1->base);
1.1  mrg     }
1.1  mrg   else
1.1  mrg     {
1.1  mrg       diff = fold_build2 (PLUS_EXPR, type1,
1.1  mrg 			  iv1->step, build_int_cst (type1, 1));
1.1  mrg
1.1  mrg       if (!POINTER_TYPE_P (type))
1.1  mrg 	{
1.1  mrg 	  bound = fold_build2 (PLUS_EXPR, type1,
1.1  mrg 			       TYPE_MAX_VALUE (type), diff);
1.1  mrg 	  assumption = fold_build2 (LE_EXPR, boolean_type_node,
1.1  mrg 				    iv1->base, bound);
1.1  mrg 	}
1.1  mrg
1.1  mrg       mbzl = fold_convert (type1, iv0->base);
1.1  mrg       mbzr = fold_build2 (MINUS_EXPR, type1,
1.1  mrg 			  fold_convert (type1, iv1->base), diff);
1.1  mrg     }
1.1  mrg
1.1  mrg   if (!integer_nonzerop (assumption))
1.1  mrg     niter->assumptions = fold_build2 (TRUTH_AND_EXPR, boolean_type_node,
1.1  mrg 				      niter->assumptions, assumption);
1.1  mrg   if (!rolls_p)
1.1  mrg     {
1.1  mrg       mbz = fold_build2 (GT_EXPR, boolean_type_node, mbzl, mbzr);
1.1  mrg       niter->may_be_zero = fold_build2 (TRUTH_OR_EXPR, boolean_type_node,
1.1  mrg 					niter->may_be_zero, mbz);
1.1  mrg     }
1.1  mrg }
1.1  mrg
1.1  mrg /* Determines number of iterations of loop whose ending condition
1.1  mrg    is IV0 < IV1 and looks like  {base, -C} < n,  or  n < {base, C},
1.1  mrg    i.e., the loop runs until the control iv wraps.  TYPE is the type of
1.1  mrg    the ivs.  The number of iterations is stored to NITER.
1.1  mrg
1.1  mrg    Returns false if IV1->base <= IV0->base folds to true, if the ivs have
1.1  mrg    neither of the two shapes above, or if the assumption built for the
1.1  mrg    matching shape folds to false.  Otherwise returns true after setting
1.1  mrg    NITER->niter, NITER->max and NITER->may_be_zero, extending
1.1  mrg    NITER->assumptions if needed, clearing NITER->control.no_overflow and
1.1  mrg    rewriting the exit test as a != comparison (NITER->control.base,
1.1  mrg    NITER->bound and NITER->cmp).  NITER->control is read here and must have
1.1  mrg    been filled in by the caller.  LOOP is only passed on to
1.1  mrg    simplify_using_initial_conditions.  */
1.1  mrg
1.1  mrg static bool
1.1  mrg number_of_iterations_until_wrap (class loop *loop, tree type, affine_iv *iv0,
1.1  mrg 				 affine_iv *iv1, class tree_niter_desc *niter)
1.1  mrg {
1.1  mrg   tree niter_type = unsigned_type_for (type);
1.1  mrg   tree step, num, assumptions, may_be_zero, span;
1.1  mrg   wide_int high, low, max, min;
1.1  mrg
1.1  mrg   may_be_zero = fold_build2 (LE_EXPR, boolean_type_node, iv1->base, iv0->base);
1.1  mrg   if (integer_onep (may_be_zero))
1.1  mrg     return false;
1.1  mrg
1.1  mrg   int prec = TYPE_PRECISION (type);
1.1  mrg   signop sgn = TYPE_SIGN (type);
1.1  mrg   min = wi::min_value (prec, sgn);
1.1  mrg   max = wi::max_value (prec, sgn);
1.1  mrg
1.1  mrg   /* n < {base, C}. */
1.1  mrg   if (integer_zerop (iv0->step) && !tree_int_cst_sign_bit (iv1->step))
1.1  mrg     {
1.1  mrg       step = iv1->step;
1.1  mrg       /* MIN + C - 1 <= n.  */
1.1  mrg       tree last = wide_int_to_tree (type, min + wi::to_wide (step) - 1);
1.1  mrg       assumptions = fold_build2 (LE_EXPR, boolean_type_node, last, iv0->base);
1.1  mrg       if (integer_zerop (assumptions))
1.1  mrg 	return false;
1.1  mrg
1.1  mrg       num = fold_build2 (MINUS_EXPR, niter_type,
1.1  mrg 			 wide_int_to_tree (niter_type, max),
1.1  mrg 			 fold_convert (niter_type, iv1->base));
1.1  mrg
1.1  mrg       /* When base has the form iv + 1, if we know iv >= n, then iv + 1 < n
1.1  mrg 	 only when iv + 1 overflows, i.e. when iv == TYPE_MAX_VALUE (type).
1.1  mrg 	 In that case the may-be-zero condition is replaced by the negation
1.1  mrg 	 of that, expressed as iv == TYPE_MAX_VALUE (type) below.  */
1.1  mrg       if (sgn == UNSIGNED
1.1  mrg 	  && integer_onep (step)
1.1  mrg 	  && TREE_CODE (iv1->base) == PLUS_EXPR
1.1  mrg 	  && integer_onep (TREE_OPERAND (iv1->base, 1)))
1.1  mrg 	{
1.1  mrg 	  tree cond = fold_build2 (GE_EXPR, boolean_type_node,
1.1  mrg 				   TREE_OPERAND (iv1->base, 0), iv0->base);
1.1  mrg 	  cond = simplify_using_initial_conditions (loop, cond);
1.1  mrg 	  if (integer_onep (cond))
1.1  mrg 	    may_be_zero = fold_build2 (EQ_EXPR, boolean_type_node,
1.1  mrg 				       TREE_OPERAND (iv1->base, 0),
1.1  mrg 				       TYPE_MAX_VALUE (type));
1.1  mrg 	}
1.1  mrg
1.1  mrg       high = max;
1.1  mrg       if (TREE_CODE (iv1->base) == INTEGER_CST)
1.1  mrg 	low = wi::to_wide (iv1->base) - 1;
1.1  mrg       else if (TREE_CODE (iv0->base) == INTEGER_CST)
1.1  mrg 	low = wi::to_wide (iv0->base);
1.1  mrg       else
1.1  mrg 	low = min;
1.1  mrg     }
1.1  mrg   /* {base, -C} < n.  */
1.1  mrg   else if (tree_int_cst_sign_bit (iv0->step) && integer_zerop (iv1->step))
1.1  mrg     {
1.1  mrg       step = fold_build1 (NEGATE_EXPR, TREE_TYPE (iv0->step), iv0->step);
1.1  mrg       /* MAX - C + 1 >= n.  */
1.1  mrg       tree last = wide_int_to_tree (type, max - wi::to_wide (step) + 1);
1.1  mrg       assumptions = fold_build2 (GE_EXPR, boolean_type_node, last, iv1->base);
1.1  mrg       if (integer_zerop (assumptions))
1.1  mrg 	return false;
1.1  mrg
1.1  mrg       num = fold_build2 (MINUS_EXPR, niter_type,
1.1  mrg 			 fold_convert (niter_type, iv0->base),
1.1  mrg 			 wide_int_to_tree (niter_type, min));
1.1  mrg       low = min;
1.1  mrg       if (TREE_CODE (iv0->base) == INTEGER_CST)
1.1  mrg 	high = wi::to_wide (iv0->base) + 1;
1.1  mrg       else if (TREE_CODE (iv1->base) == INTEGER_CST)
1.1  mrg 	high = wi::to_wide (iv1->base);
1.1  mrg       else
1.1  mrg 	high = max;
1.1  mrg     }
1.1  mrg   else
1.1  mrg     return false;
1.1  mrg
1.1  mrg   /* (delta + step - 1) / step.  NUM holds delta - 1 at this point, so only
1.1  mrg      STEP is added to it.  The same formula, applied to HIGH - LOW in
1.1  mrg      widest_int arithmetic, gives the constant upper bound NITER->max.  */
1.1  mrg   step = fold_convert (niter_type, step);
1.1  mrg   num = fold_build2 (PLUS_EXPR, niter_type, num, step);
1.1  mrg   niter->niter = fold_build2 (FLOOR_DIV_EXPR, niter_type, num, step);
1.1  mrg
1.1  mrg   widest_int delta, s;
1.1  mrg   delta = widest_int::from (high, sgn) - widest_int::from (low, sgn);
1.1  mrg   s = wi::to_widest (step);
1.1  mrg   delta = delta + s - 1;
1.1  mrg   niter->max = wi::udiv_floor (delta, s);
1.1  mrg
1.1  mrg   niter->may_be_zero = may_be_zero;
1.1  mrg
1.1  mrg   if (!integer_nonzerop (assumptions))
1.1  mrg     niter->assumptions = fold_build2 (TRUTH_AND_EXPR, boolean_type_node,
1.1  mrg 				      niter->assumptions, assumptions);
1.1  mrg
1.1  mrg   niter->control.no_overflow = false;
1.1  mrg
1.1  mrg   /* Update bound and exit condition as:
1.1  mrg      bound = niter * STEP + (IVbase - STEP).
1.1  mrg      { IVbase - STEP, +, STEP } != bound
1.1  mrg      Here, biasing IVbase by 1 step makes 'bound' be the value before wrap.
1.1  mrg      For a pointer typed base the subtraction is carried out in the
1.1  mrg      corresponding unsigned type and the result converted back.
1.1  mrg      */
1.1  mrg   tree base_type = TREE_TYPE (niter->control.base);
1.1  mrg   if (POINTER_TYPE_P (base_type))
1.1  mrg     {
1.1  mrg       tree utype = unsigned_type_for (base_type);
1.1  mrg       niter->control.base
1.1  mrg 	= fold_build2 (MINUS_EXPR, utype,
1.1  mrg 		       fold_convert (utype, niter->control.base),
1.1  mrg 		       fold_convert (utype, niter->control.step));
1.1  mrg       niter->control.base = fold_convert (base_type, niter->control.base);
1.1  mrg     }
1.1  mrg   else
1.1  mrg     niter->control.base
1.1  mrg       = fold_build2 (MINUS_EXPR, base_type, niter->control.base,
1.1  mrg 		     niter->control.step);
1.1  mrg
1.1  mrg   span = fold_build2 (MULT_EXPR, niter_type, niter->niter,
1.1  mrg 		      fold_convert (niter_type, niter->control.step));
1.1  mrg   niter->bound = fold_build2 (PLUS_EXPR, niter_type, span,
1.1  mrg 			      fold_convert (niter_type, niter->control.base));
1.1  mrg   niter->bound = fold_convert (type, niter->bound);
1.1  mrg   niter->cmp = NE_EXPR;
1.1  mrg
1.1  mrg   return true;
1.1  mrg }
1.1  mrg
1.1  mrg /* Determines number of iterations of loop whose ending condition
1.1  mrg    is IV0 < IV1.  TYPE is the type of the iv.  The number of
1.1  mrg    iterations is stored to NITER.  BNDS bounds the difference
1.1  mrg    IV1->base - IV0->base.  EXIT_MUST_BE_TAKEN is true if we know
1.1  mrg    that the exit must be taken eventually.  */
1.1  mrg
1.1  mrg static bool
1.1  mrg number_of_iterations_lt (class loop *loop, tree type, affine_iv *iv0,
1.1  mrg 			 affine_iv *iv1, class tree_niter_desc *niter,
1.1  mrg 			 bool exit_must_be_taken, bounds *bnds)
1.1  mrg {
1.1  mrg   tree niter_type = unsigned_type_for (type);
1.1  mrg   tree delta, step, s;
1.1  mrg   mpz_t mstep, tmp;
1.1  mrg   /* Record in NITER the control iv, the comparison it is tested with and
1.1  mrg      the bound it is compared against: IV0 with LT_EXPR and IV1's base
1.1  mrg      when IV0 has a nonzero step, IV1 with GT_EXPR and IV0's base
1.1  mrg      otherwise.  */
1.1  mrg   if (integer_nonzerop (iv0->step))
1.1  mrg     {
1.1  mrg       niter->control = *iv0;
1.1  mrg       niter->cmp = LT_EXPR;
1.1  mrg       niter->bound = iv1->base;
1.1  mrg     }
1.1  mrg   else
1.1  mrg     {
1.1  mrg       niter->control = *iv1;
1.1  mrg       niter->cmp = GT_EXPR;
1.1  mrg       niter->bound = iv0->base;
1.1  mrg     }
1.1  mrg
1.1  mrg   /* {base, -C} < n,  or n < {base, C}: the step of IV0 has its sign bit
1.1  mrg      set, or IV1 has a nonzero step whose sign bit is clear.  These forms
1.1  mrg      are handed over to number_of_iterations_until_wrap.  */
1.1  mrg   if (tree_int_cst_sign_bit (iv0->step)
1.1  mrg       || (!integer_zerop (iv1->step) && !tree_int_cst_sign_bit (iv1->step)))
1.1  mrg     return number_of_iterations_until_wrap (loop, type, iv0, iv1, niter);
1.1  mrg   /* DELTA is iv1->base - iv0->base, evaluated in the unsigned
1.1  mrg      NITER_TYPE.  */
1.1  mrg   delta = fold_build2 (MINUS_EXPR, niter_type,
1.1  mrg 		       fold_convert (niter_type, iv1->base),
1.1  mrg 		       fold_convert (niter_type, iv0->base));
1.1  mrg
1.1  mrg   /* First handle the special case that the step is +-1.  */
1.1  mrg   if ((integer_onep (iv0->step) && integer_zerop (iv1->step))
1.1  mrg       || (integer_all_onesp (iv1->step) && integer_zerop (iv0->step)))
1.1  mrg     {
1.1  mrg       /* for (i = iv0->base; i < iv1->base; i++)
1.1  mrg
1.1  mrg 	 or
1.1  mrg
1.1  mrg 	 for (i = iv1->base; i > iv0->base; i--).
1.1  mrg
1.1  mrg 	 In both cases # of iterations is iv1->base - iv0->base, assuming that
1.1  mrg 	 iv1->base >= iv0->base.
1.1  mrg
1.1  mrg 	 First try to derive a lower bound on the value of
1.1  mrg 	 iv1->base - iv0->base, computed in full precision.  If the difference
1.1  mrg 	 is nonnegative, we are done, otherwise we must record the
1.1  mrg 	 condition (iv1->base < iv0->base) in NITER->may_be_zero.
1.1  mrg
1.1  mrg 	 The iteration count is DELTA itself, its upper bound is BNDS->up,
1.1  mrg 	 and the control iv is marked as not overflowing.  */
1.1  mrg
1.1  mrg       if (mpz_sgn (bnds->below) < 0)
1.1  mrg 	niter->may_be_zero = fold_build2 (LT_EXPR, boolean_type_node,
1.1  mrg 					  iv1->base, iv0->base);
1.1  mrg       niter->niter = delta;
1.1  mrg       niter->max = widest_int::from (wi::from_mpz (niter_type, bnds->up, false),
1.1  mrg 				     TYPE_SIGN (niter_type));
1.1  mrg       niter->control.no_overflow = true;
1.1  mrg       return true;
1.1  mrg     }
1.1  mrg   /* STEP is the step of the control iv as a value of NITER_TYPE:
1.1  mrg      iv0->step, or the negation of iv1->step when IV0 has a zero step.  */
1.1  mrg   if (integer_nonzerop (iv0->step))
1.1  mrg     step = fold_convert (niter_type, iv0->step);
1.1  mrg   else
1.1  mrg     step = fold_convert (niter_type,
1.1  mrg 			 fold_build1 (NEGATE_EXPR, type, iv1->step));
1.1  mrg
1.1  mrg   /* If we can determine the final value of the control iv exactly, we can
1.1  mrg      transform the condition to != comparison.  In particular, this will be
1.1  mrg      the case if DELTA is constant.  On success the problem is restated as
1.1  mrg      the iv {0, +, STEP} running until it is equal to DELTA, and
1.1  mrg      number_of_iterations_ne computes the result.  */
1.1  mrg   if (number_of_iterations_lt_to_ne (type, iv0, iv1, niter, &delta, step,
1.1  mrg 				     exit_must_be_taken, bnds))
1.1  mrg     {
1.1  mrg       affine_iv zps;
1.1  mrg
1.1  mrg       zps.base = build_int_cst (niter_type, 0);
1.1  mrg       zps.step = step;
1.1  mrg       /* number_of_iterations_lt_to_ne will add assumptions that ensure that
1.1  mrg 	 zps does not overflow.  */
1.1  mrg       zps.no_overflow = true;
1.1  mrg
1.1  mrg       return number_of_iterations_ne (loop, type, &zps,
1.1  mrg 				      delta, niter, true, bnds);
1.1  mrg     }
1.1  mrg
1.1  mrg   /* Make sure that the control iv does not overflow.  If that cannot be
1.1  mrg      ensured, give up.  */
1.1  mrg   if (!assert_no_overflow_lt (type, iv0, iv1, niter, step))
1.1  mrg     return false;
1.1  mrg
1.1  mrg   /* We determine the number of iterations as (delta + step - 1) / step.  For
1.1  mrg      this to work, we must know that iv1->base >= iv0->base - step + 1,
1.1  mrg      otherwise the loop does not roll.  */
1.1  mrg   assert_loop_rolls_lt (type, iv0, iv1, niter, bnds);
1.1  mrg
1.1  mrg   s = fold_build2 (MINUS_EXPR, niter_type,
1.1  mrg 		   step, build_int_cst (niter_type, 1));
1.1  mrg   delta = fold_build2 (PLUS_EXPR, niter_type, delta, s);
1.1  mrg   niter->niter = fold_build2 (FLOOR_DIV_EXPR, niter_type, delta, step);
1.1  mrg   /* Compute the bound on the result the same way in arbitrary precision:
1.1  mrg      NITER->max is (BNDS->up + STEP - 1) / STEP, rounded down.  MSTEP and
1.1  mrg      TMP are temporaries that are released again below.  */
1.1  mrg   mpz_init (mstep);
1.1  mrg   mpz_init (tmp);
1.1  mrg   wi::to_mpz (wi::to_wide (step), mstep, UNSIGNED);
1.1  mrg   mpz_add (tmp, bnds->up, mstep);
1.1  mrg   mpz_sub_ui (tmp, tmp, 1);
1.1  mrg   mpz_fdiv_q (tmp, tmp, mstep);
1.1  mrg   niter->max = widest_int::from (wi::from_mpz (niter_type, tmp, false),
1.1  mrg 				 TYPE_SIGN (niter_type));
1.1  mrg   mpz_clear (mstep);
1.1  mrg   mpz_clear (tmp);
1.1  mrg
1.1  mrg   return true;
1.1  mrg }
1.1  mrg
1.1  mrg /* Computes the number of iterations of LOOP whose continuation test is
1.1  mrg    IV0 <= IV1, storing the result to NITER.  TYPE is the type of the ivs.
1.1  mrg    EXIT_MUST_BE_TAKEN says that the test is already known to fail
1.1  mrg    eventually (possibly thanks to NITER->assumptions recorded earlier).
1.1  mrg    BNDS bounds the difference IV1->base - IV0->base.
1.1  mrg
1.1  mrg    The test is turned into a strict comparison by moving the base of the
1.1  mrg    iv with zero step by one (IV1->base + 1, or IV0->base - 1), BNDS is
1.1  mrg    shifted accordingly and number_of_iterations_lt does the rest.  Note
1.1  mrg    that the base of IV0 or IV1 is modified in place.  */
1.1  mrg
1.1  mrg static bool
1.1  mrg number_of_iterations_le (class loop *loop, tree type, affine_iv *iv0,
1.1  mrg 			 affine_iv *iv1, class tree_niter_desc *niter,
1.1  mrg 			 bool exit_must_be_taken, bounds *bnds)
1.1  mrg {
1.1  mrg   const bool pointer_p = POINTER_TYPE_P (type);
1.1  mrg   const bool iv0_moves_p = integer_nonzerop (iv0->step);
1.1  mrg   /* Offsets applied to pointers are computed in sizetype.  */
1.1  mrg   tree arith_type = pointer_p ? sizetype : type;
1.1  mrg
1.1  mrg   /* With IV0 as the control variable, IV0 <= IV1 is the same as
1.1  mrg      IV0 < IV1 + 1 only if IV1 is not the greatest value of the type (and
1.1  mrg      symmetrically for the least value when IV1 is the control variable).
1.1  mrg      We need to know this anyway, because otherwise the loop never
1.1  mrg      terminates.  Pointer ivs are exempt: code cannot rely on an object
1.1  mrg      sitting at the very end of the address space, and
1.1  mrg      TYPE_{MIN,MAX}_VALUE is not defined for pointers.  */
1.1  mrg   if (!exit_must_be_taken && !pointer_p)
1.1  mrg     {
1.1  mrg       tree not_extreme;
1.1  mrg
1.1  mrg       if (iv0_moves_p)
1.1  mrg 	not_extreme = fold_build2 (NE_EXPR, boolean_type_node,
1.1  mrg 				   iv1->base, TYPE_MAX_VALUE (type));
1.1  mrg       else
1.1  mrg 	not_extreme = fold_build2 (NE_EXPR, boolean_type_node,
1.1  mrg 				   iv0->base, TYPE_MIN_VALUE (type));
1.1  mrg
1.1  mrg       /* Known to be violated: nothing can be determined.  */
1.1  mrg       if (integer_zerop (not_extreme))
1.1  mrg 	return false;
1.1  mrg
1.1  mrg       /* Not known to hold: record it as an assumption.  */
1.1  mrg       if (!integer_nonzerop (not_extreme))
1.1  mrg 	niter->assumptions = fold_build2 (TRUTH_AND_EXPR, boolean_type_node,
1.1  mrg 					  niter->assumptions, not_extreme);
1.1  mrg     }
1.1  mrg
1.1  mrg   /* Move the bound by one so that the comparison becomes strict.  */
1.1  mrg   if (iv0_moves_p)
1.1  mrg     {
1.1  mrg       if (pointer_p)
1.1  mrg 	iv1->base = fold_build_pointer_plus_hwi (iv1->base, 1);
1.1  mrg       else
1.1  mrg 	iv1->base = fold_build2 (PLUS_EXPR, arith_type, iv1->base,
1.1  mrg 				 build_int_cst (arith_type, 1));
1.1  mrg     }
1.1  mrg   else
1.1  mrg     {
1.1  mrg       if (pointer_p)
1.1  mrg 	iv0->base = fold_build_pointer_plus_hwi (iv0->base, -1);
1.1  mrg       else
1.1  mrg 	iv0->base = fold_build2 (MINUS_EXPR, arith_type,
1.1  mrg 				 iv0->base, build_int_cst (arith_type, 1));
1.1  mrg     }
1.1  mrg
1.1  mrg   /* The difference of the bases grew by one in either case.  */
1.1  mrg   bounds_add (bnds, 1, arith_type);
1.1  mrg
1.1  mrg   return number_of_iterations_lt (loop, type, iv0, iv1, niter,
1.1  mrg 				  exit_must_be_taken, bnds);
1.1  mrg }
1.1  mrg
1.1  mrg /* Dumps description of affine induction variable IV to FILE.  An iv with
1.1  mrg    zero step is printed as its base only; otherwise the output has the
1.1  mrg    form "[base, + , step]", followed by "(no_overflow)" when
1.1  mrg    IV->no_overflow is set.  All output goes to FILE, including the base
1.1  mrg    and step expressions (which used to be printed to the global dump_file
1.1  mrg    regardless of FILE).  */
1.1  mrg
1.1  mrg static void
1.1  mrg dump_affine_iv (FILE *file, affine_iv *iv)
1.1  mrg {
1.1  mrg   if (!integer_zerop (iv->step))
1.1  mrg     fprintf (file, "[");
1.1  mrg
1.1  mrg   print_generic_expr (file, iv->base, TDF_SLIM);
1.1  mrg
1.1  mrg   if (!integer_zerop (iv->step))
1.1  mrg     {
1.1  mrg       fprintf (file, ", + , ");
1.1  mrg       print_generic_expr (file, iv->step, TDF_SLIM);
1.1  mrg       fprintf (file, "]%s", iv->no_overflow ? "(no_overflow)" : "");
1.1  mrg     }
1.1  mrg }
1.1  mrg
1.1  mrg /* Determine the number of iterations according to condition (for staying
1.1  mrg    inside loop) which compares two induction variables using comparison
1.1  mrg    operator CODE.  The induction variable on left side of the comparison
1.1  mrg    is IV0, the right-hand side is IV1.  Both induction variables must have
1.1  mrg    type TYPE, which must be an integer or pointer type.  The steps of the
1.1  mrg    ivs must be constants (or NULL_TREE, which is interpreted as constant zero).
1.1  mrg
1.1  mrg    LOOP is the loop whose number of iterations we are determining.
1.1  mrg
1.1  mrg    ONLY_EXIT is true if we are sure this is the only way the loop could be
1.1  mrg    exited (including possibly non-returning function calls, exceptions, etc.)
1.1  mrg    -- in this case we can use the information whether the control induction
1.1  mrg    variables can overflow or not in a more efficient way.
1.1  mrg
1.1  mrg    If EVERY_ITERATION is true, we know the test is executed on every
1.1  mrg    iteration.
1.1  mrg
1.1  mrg    The results (number of iterations and assumptions as described in
1.1  mrg    comments at class tree_niter_desc in tree-ssa-loop.h) are stored to NITER.
1.1  mrg    Returns false if it fails to determine number of iterations, true if it
1.1  mrg    was determined (possibly with some assumptions).
1.1  mrg
1.1  mrg    The objects IV0 and IV1 point to may be modified in the process: their
1.1  mrg    no_overflow flags and steps are adjusted here, and the handler for <=
1.1  mrg    adjusts one of the bases.  */
1.1  mrg
1.1  mrg static bool
1.1  mrg number_of_iterations_cond (class loop *loop,
1.1  mrg 			   tree type, affine_iv *iv0, enum tree_code code,
1.1  mrg 			   affine_iv *iv1, class tree_niter_desc *niter,
1.1  mrg 			   bool only_exit, bool every_iteration)
1.1  mrg {
1.1  mrg   bool exit_must_be_taken = false, ret;
1.1  mrg   bounds bnds;
1.1  mrg
1.1  mrg   /* If the test is not executed every iteration, wrapping may make the test
1.1  mrg      pass again.
1.1  mrg      TODO: the overflow case can be still used as unreliable estimate of upper
1.1  mrg      bound.  But we have no API to pass it down to number of iterations code
1.1  mrg      and, at present, it will not use it anyway.  */
1.1  mrg   if (!every_iteration
1.1  mrg       && (!iv0->no_overflow || !iv1->no_overflow
1.1  mrg 	  || code == NE_EXPR || code == EQ_EXPR))
1.1  mrg     return false;
1.1  mrg
1.1  mrg   /* The meaning of these assumptions is this:
1.1  mrg      if !assumptions
1.1  mrg        then the rest of information does not have to be valid
1.1  mrg      if may_be_zero then the loop does not roll, even if
1.1  mrg        niter != 0.
1.1  mrg      Start from "no assumptions needed, loop is not known to be skipped"
1.1  mrg      and leave the remaining fields empty.  */
1.1  mrg   niter->assumptions = boolean_true_node;
1.1  mrg   niter->may_be_zero = boolean_false_node;
1.1  mrg   niter->niter = NULL_TREE;
1.1  mrg   niter->max = 0;
1.1  mrg   niter->bound = NULL_TREE;
1.1  mrg   niter->cmp = ERROR_MARK;
1.1  mrg
1.1  mrg   /* Make < comparison from > ones, and for NE_EXPR comparisons, ensure that
1.1  mrg      the control variable is on lhs.  Only the local pointers IV0 and IV1
1.1  mrg      are exchanged, not the objects they point to.  */
1.1  mrg   if (code == GE_EXPR || code == GT_EXPR
1.1  mrg       || (code == NE_EXPR && integer_zerop (iv0->step)))
1.1  mrg     {
1.1  mrg       std::swap (iv0, iv1);
1.1  mrg       code = swap_tree_comparison (code);
1.1  mrg     }
1.1  mrg
1.1  mrg   if (POINTER_TYPE_P (type))
1.1  mrg     {
1.1  mrg       /* Comparison of pointers is undefined unless both iv0 and iv1 point
1.1  mrg 	 to the same object.  If they do, the control variable cannot wrap
1.1  mrg 	 (as wrap around the bounds of memory will never return a pointer
1.1  mrg 	 that would be guaranteed to point to the same object, even if we
1.1  mrg 	 avoid undefined behavior by casting to size_t and back).  */
1.1  mrg       iv0->no_overflow = true;
1.1  mrg       iv1->no_overflow = true;
1.1  mrg     }
1.1  mrg
1.1  mrg   /* If the control induction variable does not overflow and the only exit
1.1  mrg      from the loop is the one that we analyze, we know it must be taken
1.1  mrg      eventually.  */
1.1  mrg   if (only_exit)
1.1  mrg     {
1.1  mrg       if (!integer_zerop (iv0->step) && iv0->no_overflow)
1.1  mrg 	exit_must_be_taken = true;
1.1  mrg       else if (!integer_zerop (iv1->step) && iv1->no_overflow)
1.1  mrg 	exit_must_be_taken = true;
1.1  mrg     }
1.1  mrg
1.1  mrg   /* We can handle cases in which neither side of the comparison is
1.1  mrg      invariant:
1.1  mrg
1.1  mrg        {iv0.base, iv0.step} cmp_code {iv1.base, iv1.step}
1.1  mrg      as if:
1.1  mrg        {iv0.base, iv0.step - iv1.step} cmp_code {iv1.base, 0}
1.1  mrg
1.1  mrg      provided that one of the conditions below is satisfied:
1.1  mrg
1.1  mrg        a) the test is NE_EXPR;
1.1  mrg        b) iv0 and iv1 do not overflow and iv0.step - iv1.step is of
1.1  mrg 	  the same sign and of less or equal magnitude than iv0.step
1.1  mrg
1.1  mrg      This rarely occurs in practice, but it is simple enough to manage.  */
1.1  mrg   if (!integer_zerop (iv0->step) && !integer_zerop (iv1->step))
1.1  mrg     {
1.1  mrg       tree step_type = POINTER_TYPE_P (type) ? sizetype : type;
1.1  mrg       tree step = fold_binary_to_constant (MINUS_EXPR, step_type,
1.1  mrg 					   iv0->step, iv1->step);
1.1  mrg
1.1  mrg       /* For code other than NE_EXPR we have to ensure moving the evolution
1.1  mrg 	 of IV1 to that of IV0 does not introduce overflow.  For NE_EXPR the
1.1  mrg 	 transform is still done, but IV0 is no longer assumed not to
1.1  mrg 	 overflow.  */
1.1  mrg       if (TREE_CODE (step) != INTEGER_CST
1.1  mrg 	  || !iv0->no_overflow || !iv1->no_overflow)
1.1  mrg 	{
1.1  mrg 	  if (code != NE_EXPR)
1.1  mrg 	    return false;
1.1  mrg 	  iv0->no_overflow = false;
1.1  mrg 	}
1.1  mrg       /* If the new step of IV0 has changed sign or is of greater
1.1  mrg 	 magnitude than the old one, we do not know whether IV0 does overflow
1.1  mrg 	 and thus the transform is not valid for code other than NE_EXPR.  */
1.1  mrg       else if (tree_int_cst_sign_bit (step) != tree_int_cst_sign_bit (iv0->step)
1.1  mrg 	       || wi::gtu_p (wi::abs (wi::to_widest (step)),
1.1  mrg 			     wi::abs (wi::to_widest (iv0->step))))
1.1  mrg 	{
1.1  mrg 	  if (POINTER_TYPE_P (type) && code != NE_EXPR)
1.1  mrg 	    /* For relational pointer compares we have further guarantees
1.1  mrg 	       that the pointers always point to the same object (or one
1.1  mrg 	       after it) and that objects do not cross the zero page.  So
1.1  mrg 	       not only is the transform always valid for relational
1.1  mrg 	       pointer compares, we also know the resulting IV does not
1.1  mrg 	       overflow.  */
1.1  mrg 	    ;
1.1  mrg 	  else if (code != NE_EXPR)
1.1  mrg 	    return false;
1.1  mrg 	  else
1.1  mrg 	    iv0->no_overflow = false;
1.1  mrg 	}
1.1  mrg
1.1  mrg       iv0->step = step;
1.1  mrg       iv1->step = build_int_cst (step_type, 0);
1.1  mrg       iv1->no_overflow = true;
1.1  mrg     }
1.1  mrg
1.1  mrg   /* If the result of the comparison is a constant,  the loop is weird.  More
1.1  mrg      precise handling would be possible, but the situation is not common enough
1.1  mrg      to waste time on it.  */
1.1  mrg   if (integer_zerop (iv0->step) && integer_zerop (iv1->step))
1.1  mrg     return false;
1.1  mrg
1.1  mrg   /* If the loop exits immediately, there is nothing to do: the comparison
1.1  mrg      of the two bases already folds to false, so the number of iterations
1.1  mrg      is zero.  Nothing is concluded when the test is not executed on every
1.1  mrg      iteration.  */
1.1  mrg   tree tem = fold_binary (code, boolean_type_node, iv0->base, iv1->base);
1.1  mrg   if (tem && integer_zerop (tem))
1.1  mrg     {
1.1  mrg       if (!every_iteration)
1.1  mrg 	return false;
1.1  mrg       niter->niter = build_int_cst (unsigned_type_for (type), 0);
1.1  mrg       niter->max = 0;
1.1  mrg       return true;
1.1  mrg     }
1.1  mrg
1.1  mrg   /* OK, now we know we have a sensible loop.  Handle several cases, depending
1.1  mrg      on what comparison operator is used.  BNDS receives bounds on the
1.1  mrg      difference of the bases (printed below when dumping); its mpz members
1.1  mrg      are released after the switch.  */
1.1  mrg   bound_difference (loop, iv1->base, iv0->base, &bnds);
1.1  mrg
1.1  mrg   if (dump_file && (dump_flags & TDF_DETAILS))
1.1  mrg     {
1.1  mrg       fprintf (dump_file,
1.1  mrg 	       "Analyzing # of iterations of loop %d\n", loop->num);
1.1  mrg
1.1  mrg       fprintf (dump_file, "  exit condition ");
1.1  mrg       dump_affine_iv (dump_file, iv0);
1.1  mrg       fprintf (dump_file, " %s ",
1.1  mrg 	       code == NE_EXPR ? "!="
1.1  mrg 	       : code == LT_EXPR ? "<"
1.1  mrg 	       : "<=");
1.1  mrg       dump_affine_iv (dump_file, iv1);
1.1  mrg       fprintf (dump_file, "\n");
1.1  mrg
1.1  mrg       fprintf (dump_file, "  bounds on difference of bases: ");
1.1  mrg       mpz_out_str (dump_file, 10, bnds.below);
1.1  mrg       fprintf (dump_file, " ... ");
1.1  mrg       mpz_out_str (dump_file, 10, bnds.up);
1.1  mrg       fprintf (dump_file, "\n");
1.1  mrg     }
1.1  mrg   /* Only NE_EXPR, LT_EXPR and LE_EXPR are handled here; any other code
1.1  mrg      reaching this point hits gcc_unreachable.  */
1.1  mrg   switch (code)
1.1  mrg     {
1.1  mrg     case NE_EXPR:
1.1  mrg       gcc_assert (integer_zerop (iv1->step));
1.1  mrg       ret = number_of_iterations_ne (loop, type, iv0, iv1->base, niter,
1.1  mrg 				     exit_must_be_taken, &bnds);
1.1  mrg       break;
1.1  mrg
1.1  mrg     case LT_EXPR:
1.1  mrg       ret = number_of_iterations_lt (loop, type, iv0, iv1, niter,
1.1  mrg 				     exit_must_be_taken, &bnds);
1.1  mrg       break;
1.1  mrg
1.1  mrg     case LE_EXPR:
1.1  mrg       ret = number_of_iterations_le (loop, type, iv0, iv1, niter,
1.1  mrg 				     exit_must_be_taken, &bnds);
1.1  mrg       break;
1.1  mrg
1.1  mrg     default:
1.1  mrg       gcc_unreachable ();
1.1  mrg     }
1.1  mrg
1.1  mrg   mpz_clear (bnds.up);
1.1  mrg   mpz_clear (bnds.below);
1.1  mrg
1.1  mrg   if (dump_file && (dump_flags & TDF_DETAILS))
1.1  mrg     {
1.1  mrg       if (ret)
1.1  mrg 	{
1.1  mrg 	  fprintf (dump_file, "  result:\n");
1.1  mrg 	  if (!integer_nonzerop (niter->assumptions))
1.1  mrg 	    {
1.1  mrg 	      fprintf (dump_file, "    under assumptions ");
1.1  mrg 	      print_generic_expr (dump_file, niter->assumptions, TDF_SLIM);
1.1  mrg 	      fprintf (dump_file, "\n");
1.1  mrg 	    }
1.1  mrg
1.1  mrg 	  if (!integer_zerop (niter->may_be_zero))
1.1  mrg 	    {
1.1  mrg 	      fprintf (dump_file, "    zero if ");
1.1  mrg 	      print_generic_expr (dump_file, niter->may_be_zero, TDF_SLIM);
1.1  mrg 	      fprintf (dump_file, "\n");
1.1  mrg 	    }
1.1  mrg
1.1  mrg 	  fprintf (dump_file, "    # of iterations ");
1.1  mrg 	  print_generic_expr (dump_file, niter->niter, TDF_SLIM);
1.1  mrg 	  fprintf (dump_file, ", bounded by ");
1.1  mrg 	  print_decu (niter->max, dump_file);
1.1  mrg 	  fprintf (dump_file, "\n");
1.1  mrg 	}
1.1  mrg       else
1.1  mrg 	fprintf (dump_file, "  failed\n\n");
1.1  mrg     }
1.1  mrg   return ret;
1.1  mrg }
1.1  mrg
1.1  mrg /* Returns EXPR with every occurrence of OLD replaced by (an unshared copy
1.1  mrg    of) NEW_TREE.  When VALUEIZE is non-NULL, OLD and NEW_TREE are ignored;
1.1  mrg    instead each SSA name is replaced by whatever VALUEIZE returns for it,
1.1  mrg    CONTEXT being passed through as its second argument.  Nodes whose
1.1  mrg    operands changed are copied, and folded if DO_FOLD is true; EXPR itself
1.1  mrg    is returned when nothing changed.  A NULL EXPR yields NULL_TREE.  */
1.1  mrg
1.1  mrg tree
1.1  mrg simplify_replace_tree (tree expr, tree old, tree new_tree,
1.1  mrg 		       tree (*valueize) (tree, void*), void *context,
1.1  mrg 		       bool do_fold)
1.1  mrg {
1.1  mrg   if (!expr)
1.1  mrg     return NULL_TREE;
1.1  mrg
1.1  mrg   /* Constants never need replacing.  */
1.1  mrg   if (CONSTANT_CLASS_P (expr))
1.1  mrg     return expr;
1.1  mrg
1.1  mrg   if (!valueize)
1.1  mrg     {
1.1  mrg       /* Plain substitution mode.  */
1.1  mrg       if (expr == old || operand_equal_p (expr, old, 0))
1.1  mrg 	return unshare_expr (new_tree);
1.1  mrg     }
1.1  mrg   else if (TREE_CODE (expr) == SSA_NAME)
1.1  mrg     {
1.1  mrg       /* Valueization mode: ask the callback about this name.  */
1.1  mrg       new_tree = valueize (expr, context);
1.1  mrg       if (new_tree != expr)
1.1  mrg 	return new_tree;
1.1  mrg     }
1.1  mrg
1.1  mrg   /* Only expression nodes have operands to descend into.  */
1.1  mrg   if (!EXPR_P (expr))
1.1  mrg     return expr;
1.1  mrg
1.1  mrg   tree rebuilt = NULL_TREE;
1.1  mrg   const unsigned n_operands = TREE_OPERAND_LENGTH (expr);
1.1  mrg
1.1  mrg   for (unsigned idx = 0; idx < n_operands; idx++)
1.1  mrg     {
1.1  mrg       tree operand = TREE_OPERAND (expr, idx);
1.1  mrg       tree replaced = simplify_replace_tree (operand, old, new_tree,
1.1  mrg 					     valueize, context, do_fold);
1.1  mrg       if (replaced != operand)
1.1  mrg 	{
1.1  mrg 	  /* Copy the node lazily, on the first operand that changes.  */
1.1  mrg 	  if (!rebuilt)
1.1  mrg 	    rebuilt = copy_node (expr);
1.1  mrg 	  TREE_OPERAND (rebuilt, idx) = replaced;
1.1  mrg 	}
1.1  mrg     }
1.1  mrg
1.1  mrg   if (!rebuilt)
1.1  mrg     return expr;
1.1  mrg
1.1  mrg   return do_fold ? fold (rebuilt) : rebuilt;
1.1  mrg }
1.1  mrg
1.1  mrg /* Expand definitions of ssa names in EXPR as long as they are simple
1.1  mrg    enough, and return the new expression.  If STOP is specified, stop
1.1  mrg    expanding if EXPR equals to it.  CACHE maps operands of expressions that
1.1  mrg    were already visited during this walk to their expanded form, so that a
1.1  mrg    shared operand is expanded only once.
1.1  mrg
1.1  mrg    "Simple" covers, as implemented below: single-argument PHIs, copies,
1.1  mrg    invariants, addresses based on a MEM_REF, conversions, and additions or
1.1  mrg    subtractions of an invariant.  Anything else is returned unchanged.  */
1.1  mrg
1.1  mrg static tree
1.1  mrg expand_simple_operations (tree expr, tree stop, hash_map<tree, tree> &cache)
1.1  mrg {
1.1  mrg   unsigned i, n;
1.1  mrg   tree ret = NULL_TREE, e, ee, e1;
1.1  mrg   enum tree_code code;
1.1  mrg   gimple *stmt;
1.1  mrg
1.1  mrg   if (expr == NULL_TREE)
1.1  mrg     return expr;
1.1  mrg
1.1  mrg   if (is_gimple_min_invariant (expr))
1.1  mrg     return expr;
1.1  mrg
1.1  mrg   code = TREE_CODE (expr);
1.1  mrg   if (IS_EXPR_CODE_CLASS (TREE_CODE_CLASS (code)))
1.1  mrg     {
1.1  mrg       n = TREE_OPERAND_LENGTH (expr);
1.1  mrg       for (i = 0; i < n; i++)
1.1  mrg 	{
1.1  mrg 	  e = TREE_OPERAND (expr, i);
1.1  mrg 	  /* SCEV analysis feeds us with a proper expression
1.1  mrg 	     graph matching the SSA graph.  Avoid turning it
1.1  mrg 	     into a tree here, thus handle tree sharing
1.1  mrg 	     properly.
1.1  mrg 	     ???  The SSA walk below still turns the SSA graph
1.1  mrg 	     into a tree but until we find a testcase do not
1.1  mrg 	     introduce additional tree sharing here.
1.1  mrg
1.1  mrg 	     A new cache entry is first set to E itself and is
1.1  mrg 	     overwritten after the recursive call if the expansion
1.1  mrg 	     differs.  NOTE(review): the update goes through a fresh
1.1  mrg 	     cache.get lookup rather than through CEE, presumably
1.1  mrg 	     because the recursion may insert into CACHE and
1.1  mrg 	     invalidate the reference -- confirm against hash_map.  */
1.1  mrg 	  bool existed_p;
1.1  mrg 	  tree &cee = cache.get_or_insert (e, &existed_p);
1.1  mrg 	  if (existed_p)
1.1  mrg 	    ee = cee;
1.1  mrg 	  else
1.1  mrg 	    {
1.1  mrg 	      cee = e;
1.1  mrg 	      ee = expand_simple_operations (e, stop, cache);
1.1  mrg 	      if (ee != e)
1.1  mrg 		*cache.get (e) = ee;
1.1  mrg 	    }
1.1  mrg 	  if (e == ee)
1.1  mrg 	    continue;
1.1  mrg 	  /* Copy EXPR lazily, on the first operand that changed.  */
1.1  mrg 	  if (!ret)
1.1  mrg 	    ret = copy_node (expr);
1.1  mrg
1.1  mrg 	  TREE_OPERAND (ret, i) = ee;
1.1  mrg 	}
1.1  mrg
1.1  mrg       if (!ret)
1.1  mrg 	return expr;
1.1  mrg       /* Fold the rebuilt expression; overflow warnings raised by folding
1.1  mrg 	 are deferred and then dropped.  */
1.1  mrg       fold_defer_overflow_warnings ();
1.1  mrg       ret = fold (ret);
1.1  mrg       fold_undefer_and_ignore_overflow_warnings ();
1.1  mrg       return ret;
1.1  mrg     }
1.1  mrg
1.1  mrg   /* Stop if it's not ssa name or the one we don't want to expand.  */
1.1  mrg   if (TREE_CODE (expr) != SSA_NAME || expr == stop)
1.1  mrg     return expr;
1.1  mrg
1.1  mrg   stmt = SSA_NAME_DEF_STMT (expr);
1.1  mrg   if (gimple_code (stmt) == GIMPLE_PHI)
1.1  mrg     {
1.1  mrg       basic_block src, dest;
1.1  mrg       /* Only PHIs with a single argument are looked through.  */
1.1  mrg       if (gimple_phi_num_args (stmt) != 1)
1.1  mrg 	return expr;
1.1  mrg       e = PHI_ARG_DEF (stmt, 0);
1.1  mrg
1.1  mrg       /* Avoid propagating through loop exit phi nodes, which
1.1  mrg 	 could break loop-closed SSA form restrictions.  */
1.1  mrg       dest = gimple_bb (stmt);
1.1  mrg       src = single_pred (dest);
1.1  mrg       if (TREE_CODE (e) == SSA_NAME
1.1  mrg 	  && src->loop_father != dest->loop_father)
1.1  mrg 	return expr;
1.1  mrg
1.1  mrg       return expand_simple_operations (e, stop, cache);
1.1  mrg     }
1.1  mrg   if (gimple_code (stmt) != GIMPLE_ASSIGN)
1.1  mrg     return expr;
1.1  mrg
1.1  mrg   /* Avoid expanding to expressions that contain SSA names that need
1.1  mrg      to take part in abnormal coalescing.  */
1.1  mrg   ssa_op_iter iter;
1.1  mrg   FOR_EACH_SSA_TREE_OPERAND (e, stmt, iter, SSA_OP_USE)
1.1  mrg     if (SSA_NAME_OCCURS_IN_ABNORMAL_PHI (e))
1.1  mrg       return expr;
1.1  mrg   /* From here on E is the first rhs operand and CODE the rhs code of the
1.1  mrg      defining assignment.  */
1.1  mrg   e = gimple_assign_rhs1 (stmt);
1.1  mrg   code = gimple_assign_rhs_code (stmt);
1.1  mrg   if (get_gimple_rhs_class (code) == GIMPLE_SINGLE_RHS)
1.1  mrg     {
1.1  mrg       if (is_gimple_min_invariant (e))
1.1  mrg 	return e;
1.1  mrg       /* Copies of SSA names are looked through.  The address of something
1.1  mrg 	 based on a MEM_REF becomes the expanded MEM_REF pointer plus the
1.1  mrg 	 MEM_REF offset and the constant unit offset of the access.  Other
1.1  mrg 	 single-operand right-hand sides are not expanded.  */
1.1  mrg       if (code == SSA_NAME)
1.1  mrg 	return expand_simple_operations (e, stop, cache);
1.1  mrg       else if (code == ADDR_EXPR)
1.1  mrg 	{
1.1  mrg 	  poly_int64 offset;
1.1  mrg 	  tree base = get_addr_base_and_unit_offset (TREE_OPERAND (e, 0),
1.1  mrg 						     &offset);
1.1  mrg 	  if (base
1.1  mrg 	      && TREE_CODE (base) == MEM_REF)
1.1  mrg 	    {
1.1  mrg 	      ee = expand_simple_operations (TREE_OPERAND (base, 0), stop,
1.1  mrg 					     cache);
1.1  mrg 	      return fold_build2 (POINTER_PLUS_EXPR, TREE_TYPE (expr), ee,
1.1  mrg 				  wide_int_to_tree (sizetype,
1.1  mrg 						    mem_ref_offset (base)
1.1  mrg 						    + offset));
1.1  mrg 	    }
1.1  mrg 	}
1.1  mrg
1.1  mrg       return expr;
1.1  mrg     }
1.1  mrg
1.1  mrg   switch (code)
1.1  mrg     {
1.1  mrg     CASE_CONVERT:
1.1  mrg       /* Casts are simple.  */
1.1  mrg       ee = expand_simple_operations (e, stop, cache);
1.1  mrg       return fold_build1 (code, TREE_TYPE (expr), ee);
1.1  mrg
1.1  mrg     case PLUS_EXPR:
1.1  mrg     case MINUS_EXPR:
1.1  mrg       /* Arithmetic in a type whose overflow traps is left alone.  */
1.1  mrg       if (ANY_INTEGRAL_TYPE_P (TREE_TYPE (expr))
1.1  mrg 	  && TYPE_OVERFLOW_TRAPS (TREE_TYPE (expr)))
1.1  mrg 	return expr;
1.1  mrg       /* Fallthru.  */
1.1  mrg     case POINTER_PLUS_EXPR:
1.1  mrg       /* And increments and decrements by a constant are simple.  */
1.1  mrg       e1 = gimple_assign_rhs2 (stmt);
1.1  mrg       if (!is_gimple_min_invariant (e1))
1.1  mrg 	return expr;
1.1  mrg
1.1  mrg       ee = expand_simple_operations (e, stop, cache);
1.1  mrg       return fold_build2 (code, TREE_TYPE (expr), ee, e1);
1.1  mrg
1.1  mrg     default:
1.1  mrg       return expr;
1.1  mrg     }
1.1  mrg }
1.1  mrg
1.1  mrg /* Entry point for callers without a cache of their own: expands the
1.1  mrg    simple operations in EXPR (leaving STOP alone) using a cache that lives
1.1  mrg    only for the duration of this call.  */
1.1  mrg
1.1  mrg tree
1.1  mrg expand_simple_operations (tree expr, tree stop)
1.1  mrg {
1.1  mrg   hash_map<tree, tree> expansions;
1.1  mrg   tree expanded = expand_simple_operations (expr, stop, expansions);
1.1  mrg   return expanded;
1.1  mrg }
1.1  mrg
1.1  mrg /* Attempts to simplify EXPR given that COND is known to hold.  Returns the
1.1  mrg    simplified expression, or EXPR itself when nothing could be derived.  */
1.1  mrg
1.1  mrg static tree
1.1  mrg tree_simplify_using_condition_1 (tree cond, tree expr)
1.1  mrg {
1.1  mrg   const enum tree_code expr_code = TREE_CODE (expr);
1.1  mrg
1.1  mrg   if (expr_code == INTEGER_CST)
1.1  mrg     return expr;
1.1  mrg
1.1  mrg   /* Logical connectives and conditional expressions are simplified
1.1  mrg      operand by operand and rebuilt only if some operand changed.  */
1.1  mrg   if (expr_code == TRUTH_OR_EXPR
1.1  mrg       || expr_code == TRUTH_AND_EXPR
1.1  mrg       || expr_code == COND_EXPR)
1.1  mrg     {
1.1  mrg       const bool ternary_p = (expr_code == COND_EXPR);
1.1  mrg       tree op0 = tree_simplify_using_condition_1 (cond,
1.1  mrg 						  TREE_OPERAND (expr, 0));
1.1  mrg       tree op1 = tree_simplify_using_condition_1 (cond,
1.1  mrg 						  TREE_OPERAND (expr, 1));
1.1  mrg       tree op2 = NULL_TREE;
1.1  mrg       bool unchanged = (op0 == TREE_OPERAND (expr, 0)
1.1  mrg 			&& op1 == TREE_OPERAND (expr, 1));
1.1  mrg
1.1  mrg       if (ternary_p)
1.1  mrg 	{
1.1  mrg 	  op2 = tree_simplify_using_condition_1 (cond,
1.1  mrg 						 TREE_OPERAND (expr, 2));
1.1  mrg 	  if (op2 != TREE_OPERAND (expr, 2))
1.1  mrg 	    unchanged = false;
1.1  mrg 	}
1.1  mrg
1.1  mrg       if (unchanged)
1.1  mrg 	return expr;
1.1  mrg
1.1  mrg       if (ternary_p)
1.1  mrg 	return fold_build3 (expr_code, boolean_type_node, op0, op1, op2);
1.1  mrg       return fold_build2 (expr_code, boolean_type_node, op0, op1);
1.1  mrg     }
1.1  mrg
1.1  mrg   /* When COND is an equality, try copy/constant propagation of one side
1.1  mrg      for the other inside EXPR, in both directions.  Fold does not do this
1.1  mrg      by itself because it is considered too expensive.  Only a result that
1.1  mrg      folds to a constant truth value is used.  */
1.1  mrg   if (TREE_CODE (cond) == EQ_EXPR)
1.1  mrg     {
1.1  mrg       tree lhs = TREE_OPERAND (cond, 0);
1.1  mrg       tree rhs = TREE_OPERAND (cond, 1);
1.1  mrg
1.1  mrg       tree subst = simplify_replace_tree (expr, lhs, rhs);
1.1  mrg       if (integer_zerop (subst) || integer_nonzerop (subst))
1.1  mrg 	return subst;
1.1  mrg
1.1  mrg       subst = simplify_replace_tree (expr, rhs, lhs);
1.1  mrg       if (integer_zerop (subst) || integer_nonzerop (subst))
1.1  mrg 	return subst;
1.1  mrg     }
1.1  mrg
1.1  mrg   /* The other way round, for EXPR of the form A == B or A != B: if
1.1  mrg      substituting one side for the other turns COND into false, then
1.1  mrg      A == B contradicts COND.  Hence A == B simplifies to that false
1.1  mrg      value and A != B must be true.  */
1.1  mrg   if (expr_code == EQ_EXPR || expr_code == NE_EXPR)
1.1  mrg     {
1.1  mrg       tree lhs = TREE_OPERAND (expr, 0);
1.1  mrg       tree rhs = TREE_OPERAND (expr, 1);
1.1  mrg
1.1  mrg       tree subst = simplify_replace_tree (cond, lhs, rhs);
1.1  mrg       if (integer_zerop (subst))
1.1  mrg 	return expr_code == EQ_EXPR ? subst : boolean_true_node;
1.1  mrg
1.1  mrg       subst = simplify_replace_tree (cond, rhs, lhs);
1.1  mrg       if (integer_zerop (subst))
1.1  mrg 	return expr_code == EQ_EXPR ? subst : boolean_true_node;
1.1  mrg     }
1.1  mrg
1.1  mrg   /* Does COND imply EXPR, i.e. does !COND || EXPR fold to true?  */
1.1  mrg   tree negated_cond = invert_truthvalue (cond);
1.1  mrg   tree implied = fold_binary (TRUTH_OR_EXPR, boolean_type_node,
1.1  mrg 			      negated_cond, expr);
1.1  mrg   if (implied && integer_nonzerop (implied))
1.1  mrg     return implied;
1.1  mrg
1.1  mrg   /* Does COND imply !EXPR, i.e. does COND && EXPR fold to false?  */
1.1  mrg   tree excluded = fold_binary (TRUTH_AND_EXPR, boolean_type_node,
1.1  mrg 			       cond, expr);
1.1  mrg   if (excluded && integer_zerop (excluded))
1.1  mrg     return excluded;
1.1  mrg
1.1  mrg   return expr;
1.1  mrg }
1.1  mrg
1.1  mrg /* Attempts to simplify EXPR given that COND is known to hold.  Returns the
1.1  mrg    simplified expression, or EXPR itself when nothing could be derived.
1.1  mrg
1.1  mrg    This is tree_simplify_using_condition_1 applied after the chains of
1.1  mrg    simple operations defining the ssa names in COND have been expanded, so
1.1  mrg    that casts or an increment of the bound ahead of the loop do not defeat
1.1  mrg    the simplification.  */
1.1  mrg
1.1  mrg static tree
1.1  mrg tree_simplify_using_condition (tree cond, tree expr)
1.1  mrg {
1.1  mrg   tree expanded_cond = expand_simple_operations (cond);
1.1  mrg   return tree_simplify_using_condition_1 (expanded_cond, expr);
1.1  mrg }
1.1  mrg
1.1  mrg /* Attempts to simplify EXPR using the conditions that are known to hold
1.1  mrg    on entry to LOOP.  The dominators of the loop header are walked; for
1.1  mrg    each block entered through a single true/false edge, the controlling
1.1  mrg    condition is used to simplify the expanded form of EXPR.  At most
1.1  mrg    MAX_DOMINATORS_TO_WALK such conditions are tried.  Returns the
1.1  mrg    simplified expression, or EXPR itself if nothing was simplified.  */
1.1  mrg
1.1  mrg tree
1.1  mrg simplify_using_initial_conditions (class loop *loop, tree expr)
1.1  mrg {
1.1  mrg   if (TREE_CODE (expr) == INTEGER_CST)
1.1  mrg     return expr;
1.1  mrg
1.1  mrg   tree start = expand_simple_operations (expr);
1.1  mrg   tree current = start;
1.1  mrg   int conditions_used = 0;
1.1  mrg   basic_block bb = loop->header;
1.1  mrg
1.1  mrg   /* The number of conditions tried is capped to avoid behavior quadratic
1.1  mrg      in the number of BBs times the number of loops in degenerate
1.1  mrg      cases.  */
1.1  mrg   while (bb != ENTRY_BLOCK_PTR_FOR_FN (cfun)
1.1  mrg 	 && conditions_used < MAX_DOMINATORS_TO_WALK)
1.1  mrg     {
1.1  mrg       if (single_pred_p (bb))
1.1  mrg 	{
1.1  mrg 	  edge entry = single_pred_edge (bb);
1.1  mrg
1.1  mrg 	  if (entry->flags & (EDGE_TRUE_VALUE | EDGE_FALSE_VALUE))
1.1  mrg 	    {
1.1  mrg 	      /* Rebuild the condition that holds along ENTRY.  */
1.1  mrg 	      gimple *guard = last_stmt (entry->src);
1.1  mrg 	      tree cond = fold_build2 (gimple_cond_code (guard),
1.1  mrg 				       boolean_type_node,
1.1  mrg 				       gimple_cond_lhs (guard),
1.1  mrg 				       gimple_cond_rhs (guard));
1.1  mrg 	      if (entry->flags & EDGE_FALSE_VALUE)
1.1  mrg 		cond = invert_truthvalue (cond);
1.1  mrg
1.1  mrg 	      current = tree_simplify_using_condition (cond, current);
1.1  mrg
1.1  mrg 	      /* A constant truth value cannot be improved any further.  */
1.1  mrg 	      if (current
1.1  mrg 		  && (integer_zerop (current) || integer_nonzerop (current)))
1.1  mrg 		return current;
1.1  mrg
1.1  mrg 	      ++conditions_used;
1.1  mrg 	    }
1.1  mrg 	}
1.1  mrg
1.1  mrg       bb = get_immediate_dominator (CDI_DOMINATORS, bb);
1.1  mrg     }
1.1  mrg
1.1  mrg   /* Hand back the caller's own expression if nothing was simplified.  */
1.1  mrg   if (operand_equal_p (start, current, 0))
1.1  mrg     return expr;
1.1  mrg   return current;
1.1  mrg }
1.1  mrg
1.1  mrg /* Attempts to simplify EXPR using the evolutions of the loop invariants
1.1  mrg    in the superloops of LOOP.  Logical connectives and conditional
1.1  mrg    expressions are processed operand by operand; any other expression is
1.1  mrg    replaced by its instantiated form, but only if that is an invariant.
1.1  mrg    Returns the simplified expression, or EXPR itself if nothing could be
1.1  mrg    simplified.  */
1.1  mrg
1.1  mrg static tree
1.1  mrg simplify_using_outer_evolutions (class loop *loop, tree expr)
1.1  mrg {
1.1  mrg   const enum tree_code expr_code = TREE_CODE (expr);
1.1  mrg
1.1  mrg   if (is_gimple_min_invariant (expr))
1.1  mrg     return expr;
1.1  mrg
1.1  mrg   const bool ternary_p = (expr_code == COND_EXPR);
1.1  mrg
1.1  mrg   if (!ternary_p
1.1  mrg       && expr_code != TRUTH_OR_EXPR
1.1  mrg       && expr_code != TRUTH_AND_EXPR)
1.1  mrg     {
1.1  mrg       /* Leaf case: accept the instantiated form only if it is an
1.1  mrg 	 invariant.  */
1.1  mrg       tree instantiated = instantiate_parameters (loop, expr);
1.1  mrg       if (is_gimple_min_invariant (instantiated))
1.1  mrg 	return instantiated;
1.1  mrg       return expr;
1.1  mrg     }
1.1  mrg
1.1  mrg   /* Simplify the operands and rebuild EXPR only if one of them changed.  */
1.1  mrg   tree op0 = simplify_using_outer_evolutions (loop, TREE_OPERAND (expr, 0));
1.1  mrg   tree op1 = simplify_using_outer_evolutions (loop, TREE_OPERAND (expr, 1));
1.1  mrg   tree op2 = NULL_TREE;
1.1  mrg   bool unchanged = (op0 == TREE_OPERAND (expr, 0)
1.1  mrg 		    && op1 == TREE_OPERAND (expr, 1));
1.1  mrg
1.1  mrg   if (ternary_p)
1.1  mrg     {
1.1  mrg       op2 = simplify_using_outer_evolutions (loop, TREE_OPERAND (expr, 2));
1.1  mrg       if (op2 != TREE_OPERAND (expr, 2))
1.1  mrg 	unchanged = false;
1.1  mrg     }
1.1  mrg
1.1  mrg   if (unchanged)
1.1  mrg     return expr;
1.1  mrg
1.1  mrg   if (ternary_p)
1.1  mrg     return fold_build3 (expr_code, boolean_type_node, op0, op1, op2);
1.1  mrg   return fold_build2 (expr_code, boolean_type_node, op0, op1);
1.1  mrg }
1.1  mrg
1.1  mrg /* Returns true if EXIT is the only way LOOP can be left: EXIT must be the
1.1  mrg    single exit edge of LOOP, and no statement in the blocks BODY[0] ..
1.1  mrg    BODY[LOOP->num_nodes - 1] may terminate its basic block.  */
1.1  mrg
1.1  mrg bool
1.1  mrg loop_only_exit_p (const class loop *loop, basic_block *body, const_edge exit)
1.1  mrg {
1.1  mrg   if (single_exit (loop) != exit)
1.1  mrg     return false;
1.1  mrg
1.1  mrg   for (unsigned idx = 0; idx < loop->num_nodes; idx++)
1.1  mrg     {
1.1  mrg       gimple_stmt_iterator gsi = gsi_start_bb (body[idx]);
1.1  mrg
1.1  mrg       while (!gsi_end_p (gsi))
1.1  mrg 	{
1.1  mrg 	  if (stmt_can_terminate_bb_p (gsi_stmt (gsi)))
1.1  mrg 	    return false;
1.1  mrg 	  gsi_next (&gsi);
1.1  mrg 	}
1.1  mrg     }
1.1  mrg
1.1  mrg   return true;
1.1  mrg }
1.1  mrg
1.1  mrg /* Stores description of number of iterations of LOOP derived from
1.1  mrg    EXIT (an exit edge of the LOOP) in NITER.  Returns true if some useful
1.1  mrg    information could be derived (and fields of NITER have meaning described
1.1  mrg    in comments at class tree_niter_desc declaration), false otherwise.
1.1  mrg    When EVERY_ITERATION is true, only tests that are known to be executed
1.1  mrg    every iteration are considered (i.e. only test that alone bounds the loop).
1.1  mrg    If AT_STMT is not NULL, this function stores LOOP's condition statement in
1.1  mrg    it when returning true; this also holds when the result is obtained by
1.1  mrg    matching the popcount idiom.  If BODY is NULL, the basic blocks of LOOP
1.1  mrg    are obtained by get_loop_body and released again here; otherwise the
1.1  mrg    array passed by the caller is used and left untouched.  */
1.1  mrg
1.1  mrg bool
1.1  mrg number_of_iterations_exit_assumptions (class loop *loop, edge exit,
1.1  mrg 				       class tree_niter_desc *niter,
1.1  mrg 				       gcond **at_stmt, bool every_iteration,
1.1  mrg 				       basic_block *body)
1.1  mrg {
1.1  mrg   gimple *last;
1.1  mrg   gcond *stmt;
1.1  mrg   tree type;
1.1  mrg   tree op0, op1;
1.1  mrg   enum tree_code code;
1.1  mrg   affine_iv iv0, iv1;
1.1  mrg   bool safe;
1.1  mrg
1.1  mrg   /* The condition at a fake exit (if it exists) does not control its
1.1  mrg      execution.  */
1.1  mrg   if (exit->flags & EDGE_FAKE)
1.1  mrg     return false;
1.1  mrg
1.1  mrg   /* Nothing to analyze if the loop is known to be infinite.  */
1.1  mrg   if (loop_constraint_set_p (loop, LOOP_C_INFINITE))
1.1  mrg     return false;
1.1  mrg
1.1  mrg   /* SAFE is true when the source block of EXIT dominates the latch.  */
1.1  mrg   safe = dominated_by_p (CDI_DOMINATORS, loop->latch, exit->src);
1.1  mrg
1.1  mrg   if (every_iteration && !safe)
1.1  mrg     return false;
1.1  mrg
1.1  mrg   /* Start from "no information"; the fields are filled in below.  */
1.1  mrg   niter->assumptions = boolean_false_node;
1.1  mrg   niter->control.base = NULL_TREE;
1.1  mrg   niter->control.step = NULL_TREE;
1.1  mrg   niter->control.no_overflow = false;
1.1  mrg   last = last_stmt (exit->src);
1.1  mrg   if (!last)
1.1  mrg     return false;
1.1  mrg   stmt = dyn_cast <gcond *> (last);
1.1  mrg   if (!stmt)
1.1  mrg     return false;
1.1  mrg
1.1  mrg   /* We want the condition for staying inside loop.  */
1.1  mrg   code = gimple_cond_code (stmt);
1.1  mrg   if (exit->flags & EDGE_TRUE_VALUE)
1.1  mrg     code = invert_tree_comparison (code, false);
1.1  mrg
1.1  mrg   switch (code)
1.1  mrg     {
1.1  mrg     case GT_EXPR:
1.1  mrg     case GE_EXPR:
1.1  mrg     case LT_EXPR:
1.1  mrg     case LE_EXPR:
1.1  mrg     case NE_EXPR:
1.1  mrg       break;
1.1  mrg
1.1  mrg     default:
1.1  mrg       return false;
1.1  mrg     }
1.1  mrg
1.1  mrg   op0 = gimple_cond_lhs (stmt);
1.1  mrg   op1 = gimple_cond_rhs (stmt);
1.1  mrg   type = TREE_TYPE (op0);
1.1  mrg
1.1  mrg   if (TREE_CODE (type) != INTEGER_TYPE
1.1  mrg       && !POINTER_TYPE_P (type))
1.1  mrg     return false;
1.1  mrg
1.1  mrg   tree iv0_niters = NULL_TREE;
1.1  mrg   if (!simple_iv_with_niters (loop, loop_containing_stmt (stmt),
1.1  mrg 			      op0, &iv0, safe ? &iv0_niters : NULL, false))
1.1  mrg     {
1.1  mrg       /* OP0 is not a simple induction variable; the exit may still match
1.1  mrg 	 the popcount idiom.  Record the condition statement on success
1.1  mrg 	 here as well, so that the AT_STMT contract holds on every path
1.1  mrg 	 that returns true.  */
1.1  mrg       if (!number_of_iterations_popcount (loop, exit, code, niter))
1.1  mrg 	return false;
1.1  mrg
1.1  mrg       if (at_stmt)
1.1  mrg 	*at_stmt = stmt;
1.1  mrg
1.1  mrg       return true;
1.1  mrg     }
1.1  mrg   tree iv1_niters = NULL_TREE;
1.1  mrg   if (!simple_iv_with_niters (loop, loop_containing_stmt (stmt),
1.1  mrg 			      op1, &iv1, safe ? &iv1_niters : NULL, false))
1.1  mrg     return false;
1.1  mrg   /* Give up on complicated case.  */
1.1  mrg   if (iv0_niters && iv1_niters)
1.1  mrg     return false;
1.1  mrg
1.1  mrg   /* We don't want to see undefined signed overflow warnings while
1.1  mrg      computing the number of iterations.  */
1.1  mrg   fold_defer_overflow_warnings ();
1.1  mrg
1.1  mrg   iv0.base = expand_simple_operations (iv0.base);
1.1  mrg   iv1.base = expand_simple_operations (iv1.base);
1.1  mrg
1.1  mrg   /* Only a body array obtained here is released here; an array passed
1.1  mrg      by the caller is left alone.  */
1.1  mrg   bool body_from_caller = true;
1.1  mrg   if (!body)
1.1  mrg     {
1.1  mrg       body = get_loop_body (loop);
1.1  mrg       body_from_caller = false;
1.1  mrg     }
1.1  mrg   bool only_exit_p = loop_only_exit_p (loop, body, exit);
1.1  mrg   if (!body_from_caller)
1.1  mrg     free (body);
1.1  mrg   if (!number_of_iterations_cond (loop, type, &iv0, code, &iv1, niter,
1.1  mrg 				  only_exit_p, safe))
1.1  mrg     {
1.1  mrg       fold_undefer_and_ignore_overflow_warnings ();
1.1  mrg       return false;
1.1  mrg     }
1.1  mrg
1.1  mrg   /* Incorporate additional assumption implied by control iv.  */
1.1  mrg   tree iv_niters = iv0_niters ? iv0_niters : iv1_niters;
1.1  mrg   if (iv_niters)
1.1  mrg     {
1.1  mrg       tree assumption = fold_build2 (LE_EXPR, boolean_type_node, niter->niter,
1.1  mrg 				     fold_convert (TREE_TYPE (niter->niter),
1.1  mrg 						   iv_niters));
1.1  mrg
1.1  mrg       if (!integer_nonzerop (assumption))
1.1  mrg 	niter->assumptions = fold_build2 (TRUTH_AND_EXPR, boolean_type_node,
1.1  mrg 					  niter->assumptions, assumption);
1.1  mrg
1.1  mrg       /* Refine upper bound if possible.  */
1.1  mrg       if (TREE_CODE (iv_niters) == INTEGER_CST
1.1  mrg 	  && niter->max > wi::to_widest (iv_niters))
1.1  mrg 	niter->max = wi::to_widest (iv_niters);
1.1  mrg     }
1.1  mrg
1.1  mrg   /* There is no assumptions if the loop is known to be finite.  */
1.1  mrg   if (!integer_zerop (niter->assumptions)
1.1  mrg       && loop_constraint_set_p (loop, LOOP_C_FINITE))
1.1  mrg     niter->assumptions = boolean_true_node;
1.1  mrg
1.1  mrg   /* Simplification using the outer evolutions is attempted only at
1.1  mrg      -O3 and above.  */
1.1  mrg   if (optimize >= 3)
1.1  mrg     {
1.1  mrg       niter->assumptions = simplify_using_outer_evolutions (loop,
1.1  mrg 							    niter->assumptions);
1.1  mrg       niter->may_be_zero = simplify_using_outer_evolutions (loop,
1.1  mrg 							    niter->may_be_zero);
1.1  mrg       niter->niter = simplify_using_outer_evolutions (loop, niter->niter);
1.1  mrg     }
1.1  mrg
1.1  mrg   niter->assumptions
1.1  mrg     = simplify_using_initial_conditions (loop, niter->assumptions);
1.1  mrg   niter->may_be_zero
1.1  mrg     = simplify_using_initial_conditions (loop, niter->may_be_zero);
1.1  mrg
1.1  mrg   fold_undefer_and_ignore_overflow_warnings ();
1.1  mrg
1.1  mrg   /* If NITER has simplified into a constant, update MAX.  */
1.1  mrg   if (TREE_CODE (niter->niter) == INTEGER_CST)
1.1  mrg     niter->max = wi::to_widest (niter->niter);
1.1  mrg
1.1  mrg   if (at_stmt)
1.1  mrg     *at_stmt = stmt;
1.1  mrg
1.1  mrg   return (!integer_zerop (niter->assumptions));
1.1  mrg }
1.1  mrg
1.1  mrg
1.1  mrg /* Returns true if OP is an SSA name whose defining statement is an
1.1  mrg    assignment of the form OP = VAL + -1.  */
1.1  mrg
1.1  mrg static bool
1.1  mrg ssa_defined_by_minus_one_stmt_p (tree op, tree val)
1.1  mrg {
1.1  mrg   if (TREE_CODE (op) != SSA_NAME)
1.1  mrg     return false;
1.1  mrg
1.1  mrg   gimple *def = SSA_NAME_DEF_STMT (op);
1.1  mrg   if (!def || !is_gimple_assign (def))
1.1  mrg     return false;
1.1  mrg
1.1  mrg   /* The decrement is looked for as an addition of -1.  */
1.1  mrg   if (gimple_assign_rhs_code (def) != PLUS_EXPR)
1.1  mrg     return false;
1.1  mrg
1.1  mrg   return (gimple_assign_rhs1 (def) == val
1.1  mrg 	  && integer_minus_onep (gimple_assign_rhs2 (def)));
1.1  mrg }
1.1  mrg
1.1  mrg
1.1  mrg /* See if LOOP is a popcount implementation and, if so, determine NITER
1.1  mrg    for the loop.
1.1  mrg
1.1  mrg    We match:
1.1  mrg    <bb 2>
1.1  mrg    goto <bb 4>
1.1  mrg
1.1  mrg    <bb 3>
1.1  mrg    _1 = b_11 + -1
1.1  mrg    b_6 = _1 & b_11
1.1  mrg
1.1  mrg    <bb 4>
1.1  mrg    b_11 = PHI <b_5(D)(2), b_6(3)>
1.1  mrg
1.1  mrg    exit block
1.1  mrg    if (b_11 != 0)
1.1  mrg 	goto <bb 3>
1.1  mrg    else
1.1  mrg 	goto <bb 5>
1.1  mrg
1.1  mrg    OR we match copy-header version:
1.1  mrg    if (b_5 != 0)
1.1  mrg 	goto <bb 3>
1.1  mrg    else
1.1  mrg 	goto <bb 4>
1.1  mrg
1.1  mrg    <bb 3>
1.1  mrg    b_11 = PHI <b_5(2), b_6(3)>
1.1  mrg    _1 = b_11 + -1
1.1  mrg    b_6 = _1 & b_11
1.1  mrg
1.1  mrg    exit block
1.1  mrg    if (b_6 != 0)
1.1  mrg 	goto <bb 3>
1.1  mrg    else
1.1  mrg 	goto <bb 4>
1.1  mrg
1.1  mrg    CODE is the comparison under which the loop continues; only NE_EXPR
1.1  mrg    against zero is accepted.  If the popcount pattern is found, NITER is
1.1  mrg    updated accordingly, i.e. its iteration count is expressed through
1.1  mrg    __builtin_popcount (b), and true is returned.  Otherwise false is
1.1  mrg    returned.  */
1.1  mrg
1.1  mrg static bool
1.1  mrg number_of_iterations_popcount (loop_p loop, edge exit,
1.1  mrg 			       enum tree_code code,
1.1  mrg 			       class tree_niter_desc *niter)
1.1  mrg {
1.1  mrg   /* The loop terminating branch has to look like if (b != 0).  */
1.1  mrg   gimple *stmt = last_stmt (exit->src);
1.1  mrg   if (!stmt || gimple_code (stmt) != GIMPLE_COND)
1.1  mrg     return false;
1.1  mrg   if (code != NE_EXPR)
1.1  mrg     return false;
1.1  mrg   if (!integer_zerop (gimple_cond_rhs (stmt))
1.1  mrg       || TREE_CODE (gimple_cond_lhs (stmt)) != SSA_NAME)
1.1  mrg     return false;
1.1  mrg
1.1  mrg   /* ADJUST remains true when the exit condition tests the result of the
1.1  mrg      AND statement directly (the copy-header version); the iteration
1.1  mrg      count is then one less than the popcount.  */
1.1  mrg   bool adjust = true;
1.1  mrg   gimple *and_stmt = SSA_NAME_DEF_STMT (gimple_cond_lhs (stmt));
1.1  mrg
1.1  mrg   /* Depending on whether copy-header was performed, the tested name may
1.1  mrg      instead be defined by the PHI in the loop header
1.1  mrg        b_11 = PHI <b_5(D)(2), b_6(3)>
1.1  mrg      in which case the AND statement b_6 = _1 & b_11 is reached through
1.1  mrg      the PHI argument on the latch edge.  */
1.1  mrg   if (gimple_code (and_stmt) == GIMPLE_PHI
1.1  mrg       && gimple_bb (and_stmt) == loop->header
1.1  mrg       && gimple_phi_num_args (and_stmt) == 2)
1.1  mrg     {
1.1  mrg       tree latch_val
1.1  mrg 	= gimple_phi_arg_def (and_stmt, loop_latch_edge (loop)->dest_idx);
1.1  mrg
1.1  mrg       if (TREE_CODE (latch_val) == SSA_NAME)
1.1  mrg 	{
1.1  mrg 	  and_stmt = SSA_NAME_DEF_STMT (latch_val);
1.1  mrg 	  adjust = false;
1.1  mrg 	}
1.1  mrg     }
1.1  mrg
1.1  mrg   /* Make sure it is indeed an AND statement (b_6 = _1 & b_11).  */
1.1  mrg   if (!is_gimple_assign (and_stmt)
1.1  mrg       || gimple_assign_rhs_code (and_stmt) != BIT_AND_EXPR)
1.1  mrg     return false;
1.1  mrg
1.1  mrg   /* One operand (RECUR, b_11 above) has to be the recurrence and the
1.1  mrg      other one (DECR, _1 above) has to be defined as RECUR + -1.  The
1.1  mrg      operands are swapped if they appear in the reversed order.  */
1.1  mrg   tree recur = gimple_assign_rhs1 (and_stmt);
1.1  mrg   tree decr = gimple_assign_rhs2 (and_stmt);
1.1  mrg
1.1  mrg   if (ssa_defined_by_minus_one_stmt_p (recur, decr))
1.1  mrg     std::swap (recur, decr);
1.1  mrg   else if (!ssa_defined_by_minus_one_stmt_p (decr, recur))
1.1  mrg     return false;
1.1  mrg
1.1  mrg   /* Check the recurrence:
1.1  mrg      ... = PHI <b_5(2), b_6(3)>.  */
1.1  mrg   gimple *phi = SSA_NAME_DEF_STMT (recur);
1.1  mrg   if (gimple_code (phi) != GIMPLE_PHI)
1.1  mrg     return false;
1.1  mrg
1.1  mrg   edge latch = loop_latch_edge (loop);
1.1  mrg   if (gimple_bb (phi) != latch->dest
1.1  mrg       || (gimple_assign_lhs (and_stmt)
1.1  mrg 	  != gimple_phi_arg_def (phi, latch->dest_idx)))
1.1  mrg     return false;
1.1  mrg
1.1  mrg   /* We found a match.  Get the popcount builtin corresponding to the
1.1  mrg      precision of the initial value.  */
1.1  mrg   tree src = gimple_phi_arg_def (phi, loop_preheader_edge (loop)->dest_idx);
1.1  mrg   const unsigned src_prec = TYPE_PRECISION (TREE_TYPE (src));
1.1  mrg   const unsigned ll_prec = TYPE_PRECISION (long_long_integer_type_node);
1.1  mrg   tree fn = NULL_TREE;
1.1  mrg
1.1  mrg   if (src_prec <= TYPE_PRECISION (integer_type_node))
1.1  mrg     fn = builtin_decl_implicit (BUILT_IN_POPCOUNT);
1.1  mrg   else if (src_prec == TYPE_PRECISION (long_integer_type_node))
1.1  mrg     fn = builtin_decl_implicit (BUILT_IN_POPCOUNTL);
1.1  mrg   else if (src_prec == ll_prec || src_prec == 2 * ll_prec)
1.1  mrg     fn = builtin_decl_implicit (BUILT_IN_POPCOUNTLL);
1.1  mrg
1.1  mrg   if (!fn)
1.1  mrg     return false;
1.1  mrg
1.1  mrg   /* Update NITER params accordingly.  The argument is made unsigned and
1.1  mrg      is widened to unsigned int if it is narrower than int.  */
1.1  mrg   tree utype = unsigned_type_for (TREE_TYPE (src));
1.1  mrg   src = fold_convert (utype, src);
1.1  mrg   if (TYPE_PRECISION (TREE_TYPE (src)) < TYPE_PRECISION (integer_type_node))
1.1  mrg     src = fold_convert (unsigned_type_node, src);
1.1  mrg
1.1  mrg   tree call;
1.1  mrg   if (TYPE_PRECISION (TREE_TYPE (src)) == 2 * ll_prec)
1.1  mrg     {
1.1  mrg       /* Twice the precision of long long: sum the popcounts of the upper
1.1  mrg 	 and of the lower half.  */
1.1  mrg       tree shifted = fold_build2 (RSHIFT_EXPR, TREE_TYPE (src),
1.1  mrg 				  unshare_expr (src),
1.1  mrg 				  build_int_cst (integer_type_node, ll_prec));
1.1  mrg       tree upper = fold_convert (long_long_unsigned_type_node, shifted);
1.1  mrg       tree lower = fold_convert (long_long_unsigned_type_node, src);
1.1  mrg
1.1  mrg       call = build_call_expr (fn, 1, upper);
1.1  mrg       call = fold_build2 (PLUS_EXPR, TREE_TYPE (call), call,
1.1  mrg 			  build_call_expr (fn, 1, lower));
1.1  mrg       call = fold_convert (utype, call);
1.1  mrg     }
1.1  mrg   else
1.1  mrg     call = fold_convert (utype, build_call_expr (fn, 1, src));
1.1  mrg
1.1  mrg   /* Without a constant result, the precision of the argument bounds the
1.1  mrg      number of set bits.  */
1.1  mrg   tree iter = call;
1.1  mrg   HOST_WIDE_INT max;
1.1  mrg   if (TREE_CODE (call) == INTEGER_CST)
1.1  mrg     max = tree_to_uhwi (call);
1.1  mrg   else
1.1  mrg     max = TYPE_PRECISION (TREE_TYPE (src));
1.1  mrg
1.1  mrg   if (adjust)
1.1  mrg     {
1.1  mrg       iter = fold_build2 (MINUS_EXPR, utype, call, build_int_cst (utype, 1));
1.1  mrg       max = max - 1;
1.1  mrg     }
1.1  mrg
1.1  mrg   niter->niter = iter;
1.1  mrg   niter->assumptions = boolean_true_node;
1.1  mrg
1.1  mrg   if (adjust)
1.1  mrg     {
1.1  mrg       /* MAY_BE_ZERO is the condition that the initial value is zero.  */
1.1  mrg       tree may_be_zero = fold_build2 (EQ_EXPR, boolean_type_node, src,
1.1  mrg 				      build_zero_cst (TREE_TYPE (src)));
1.1  mrg       niter->may_be_zero
1.1  mrg 	= simplify_using_initial_conditions (loop, may_be_zero);
1.1  mrg     }
1.1  mrg   else
1.1  mrg     niter->may_be_zero = boolean_false_node;
1.1  mrg
1.1  mrg   niter->max = max;
1.1  mrg   niter->bound = NULL_TREE;
1.1  mrg   niter->cmp = ERROR_MARK;
1.1  mrg   return true;
1.1  mrg }
1.1  mrg
1.1  mrg
1.1  mrg /* Like number_of_iterations_exit_assumptions, but return TRUE only if
1.1  mrg    the niter information holds unconditionally.  If it holds only under
1.1  mrg    assumptions, WARN is true and dumping is enabled, a missed-optimization
1.1  mrg    note is emitted at the condition statement.  */
1.1  mrg
1.1  mrg bool
1.1  mrg number_of_iterations_exit (class loop *loop, edge exit,
1.1  mrg 			   class tree_niter_desc *niter,
1.1  mrg 			   bool warn, bool every_iteration,
1.1  mrg 			   basic_block *body)
1.1  mrg {
1.1  mrg   gcond *cond_stmt;
1.1  mrg   const bool analyzed
1.1  mrg     = number_of_iterations_exit_assumptions (loop, exit, niter, &cond_stmt,
1.1  mrg 					     every_iteration, body);
1.1  mrg   if (!analyzed)
1.1  mrg     return false;
1.1  mrg
1.1  mrg   const bool unconditional = integer_nonzerop (niter->assumptions);
1.1  mrg
1.1  mrg   if (!unconditional && warn && dump_enabled_p ())
1.1  mrg     dump_printf_loc (MSG_MISSED_OPTIMIZATION, cond_stmt,
1.1  mrg 		     "missed loop optimization: niters analysis ends up "
1.1  mrg 		     "with assumptions.\n");
1.1  mrg
1.1  mrg   return unconditional;
1.1  mrg }
1.1  mrg
1.1  mrg /* Try to determine the number of iterations of LOOP.  On success the
1.1  mrg    expression giving the number of iterations is returned and *EXIT is
1.1  mrg    set to the edge the information was obtained from.  Otherwise
1.1  mrg    chrec_dont_know is returned and *EXIT is NULL.  */
1.1  mrg
1.1  mrg tree
1.1  mrg find_loop_niter (class loop *loop, edge *exit)
1.1  mrg {
1.1  mrg   auto_vec<edge> exits = get_loop_exit_edges (loop);
1.1  mrg   class tree_niter_desc desc;
1.1  mrg   tree best = NULL_TREE;
1.1  mrg   edge ex;
1.1  mrg   unsigned ix;
1.1  mrg
1.1  mrg   *exit = NULL;
1.1  mrg   FOR_EACH_VEC_ELT (exits, ix, ex)
1.1  mrg     {
1.1  mrg       if (!number_of_iterations_exit (loop, ex, &desc, false))
1.1  mrg 	continue;
1.1  mrg
1.1  mrg       if (integer_nonzerop (desc.may_be_zero))
1.1  mrg 	{
1.1  mrg 	  /* We exit in the first iteration through this exit.
1.1  mrg 	     We won't find anything better.  */
1.1  mrg 	  best = build_int_cst (unsigned_type_node, 0);
1.1  mrg 	  *exit = ex;
1.1  mrg 	  break;
1.1  mrg 	}
1.1  mrg
1.1  mrg       /* Exits whose MAY_BE_ZERO is not known to be false are ignored.  */
1.1  mrg       if (!integer_zerop (desc.may_be_zero))
1.1  mrg 	continue;
1.1  mrg
1.1  mrg       tree cand = desc.niter;
1.1  mrg       bool take;
1.1  mrg
1.1  mrg       if (!best)
1.1  mrg 	/* Nothing recorded yet.  */
1.1  mrg 	take = true;
1.1  mrg       else if (TREE_CODE (cand) != INTEGER_CST)
1.1  mrg 	/* Prefer constants; a symbolic candidate never replaces what we
1.1  mrg 	   already have.  */
1.1  mrg 	take = false;
1.1  mrg       else if (TREE_CODE (best) != INTEGER_CST)
1.1  mrg 	take = true;
1.1  mrg       else
1.1  mrg 	/* Both are constants, the lower the better.  */
1.1  mrg 	take = tree_int_cst_lt (cand, best);
1.1  mrg
1.1  mrg       if (take)
1.1  mrg 	{
1.1  mrg 	  best = cand;
1.1  mrg 	  *exit = ex;
1.1  mrg 	}
1.1  mrg     }
1.1  mrg
1.1  mrg   return best ? best : chrec_dont_know;
1.1  mrg }
1.1  mrg
1.1  mrg /* Return true if LOOP is known to have bounded number of iterations.
1.1  mrg    This is the case if the current function is const or pure (and not
1.1  mrg    marked as looping), if an upper bound on the number of iterations is
1.1  mrg    known, or if LOOP->finite_p is set and LOOP has an exit that is not
1.1  mrg    an EH, abnormal or fake edge.  */
1.1  mrg
1.1  mrg bool
1.1  mrg finite_loop_p (class loop *loop)
1.1  mrg {
1.1  mrg   const int fn_flags = flags_from_decl_or_type (current_function_decl);
1.1  mrg   const bool const_or_pure = (fn_flags & (ECF_CONST|ECF_PURE)) != 0;
1.1  mrg   const bool may_loop = (fn_flags & ECF_LOOPING_CONST_OR_PURE) != 0;
1.1  mrg
1.1  mrg   if (const_or_pure && !may_loop)
1.1  mrg     {
1.1  mrg       if (dump_file && (dump_flags & TDF_DETAILS))
1.1  mrg 	fprintf (dump_file, "Found loop %i to be finite: it is within pure or const function.\n",
1.1  mrg 		 loop->num);
1.1  mrg       return true;
1.1  mrg     }
1.1  mrg
1.1  mrg   widest_int nit;
1.1  mrg   if (loop->any_upper_bound
1.1  mrg       || max_loop_iterations (loop, &nit))
1.1  mrg     {
1.1  mrg       if (dump_file && (dump_flags & TDF_DETAILS))
1.1  mrg 	fprintf (dump_file, "Found loop %i to be finite: upper bound found.\n",
1.1  mrg 		 loop->num);
1.1  mrg       return true;
1.1  mrg     }
1.1  mrg
1.1  mrg   if (!loop->finite_p)
1.1  mrg     return false;
1.1  mrg
1.1  mrg   /* If the loop has a normal exit, we can assume it will terminate.  */
1.1  mrg   auto_vec<edge> exits = get_loop_exit_edges (loop);
1.1  mrg   edge ex;
1.1  mrg   unsigned ix;
1.1  mrg
1.1  mrg   FOR_EACH_VEC_ELT (exits, ix, ex)
1.1  mrg     {
1.1  mrg       if (ex->flags & (EDGE_EH | EDGE_ABNORMAL | EDGE_FAKE))
1.1  mrg 	continue;
1.1  mrg
1.1  mrg       if (dump_file)
1.1  mrg 	fprintf (dump_file, "Assume loop %i to be finite: it has an exit "
1.1  mrg 		 "and -ffinite-loops is on.\n", loop->num);
1.1  mrg       return true;
1.1  mrg     }
1.1  mrg
1.1  mrg   return false;
1.1  mrg }
1.1  mrg
1.1  mrg /*
1.1  mrg
1.1  mrg    Analysis of a number of iterations of a loop by a brute-force evaluation.
1.1  mrg
1.1  mrg */
1.1  mrg
1.1  mrg /* Bound on the number of iterations we try to evaluate.  This is the
1.1  mrg    value of param_max_iterations_to_track converted to unsigned, so that
1.1  mrg    it can be compared with an unsigned iteration counter.  */
1.1  mrg
1.1  mrg #define MAX_ITERATIONS_TO_TRACK \
1.1  mrg   ((unsigned) param_max_iterations_to_track)
1.1  mrg
1.1  mrg /* Returns the loop phi node of LOOP such that ssa name X is derived from its
1.1  mrg    result by a chain of operations such that all but exactly one of their
1.1  mrg    operands are constants.  Returns NULL if there is no such phi node.  */
1.1  mrg
1.1  mrg static gphi *
1.1  mrg chain_of_csts_start (class loop *loop, tree x)
1.1  mrg {
1.1  mrg   /* Follow the definitions upwards, one statement per round, until the
1.1  mrg      header phi node is reached or the chain turns out to be unusable.  */
1.1  mrg   for (;;)
1.1  mrg     {
1.1  mrg       gimple *def = SSA_NAME_DEF_STMT (x);
1.1  mrg       basic_block def_bb = gimple_bb (def);
1.1  mrg
1.1  mrg       /* The whole chain has to stay inside LOOP.  */
1.1  mrg       if (!def_bb || !flow_bb_inside_loop_p (loop, def_bb))
1.1  mrg 	return NULL;
1.1  mrg
1.1  mrg       /* A phi node ends the chain; only one in the loop header is
1.1  mrg 	 acceptable.  */
1.1  mrg       if (gimple_code (def) == GIMPLE_PHI)
1.1  mrg 	{
1.1  mrg 	  if (def_bb != loop->header)
1.1  mrg 	    return NULL;
1.1  mrg
1.1  mrg 	  return as_a <gphi *> (def);
1.1  mrg 	}
1.1  mrg
1.1  mrg       if (gimple_code (def) != GIMPLE_ASSIGN
1.1  mrg 	  || gimple_assign_rhs_class (def) == GIMPLE_TERNARY_RHS)
1.1  mrg 	return NULL;
1.1  mrg
1.1  mrg       /* Memory references and addresses of non-invariants are rejected.  */
1.1  mrg       const enum tree_code rhs_code = gimple_assign_rhs_code (def);
1.1  mrg       if (gimple_references_memory_p (def)
1.1  mrg 	  || TREE_CODE_CLASS (rhs_code) == tcc_reference
1.1  mrg 	  || (rhs_code == ADDR_EXPR
1.1  mrg 	      && !is_gimple_min_invariant (gimple_assign_rhs1 (def))))
1.1  mrg 	return NULL;
1.1  mrg
1.1  mrg       /* Continue with the single SSA use of the statement, if there is
1.1  mrg 	 exactly one.  */
1.1  mrg       x = SINGLE_SSA_TREE_OPERAND (def, SSA_OP_USE);
1.1  mrg       if (x == NULL_TREE)
1.1  mrg 	return NULL;
1.1  mrg     }
1.1  mrg }
1.1  mrg
1.1  mrg /* Determines whether the expression X is derived from a result of a phi node
1.1  mrg    in header of LOOP such that
1.1  mrg
1.1  mrg    * the derivation of X consists only from operations with constants
1.1  mrg    * the initial value of the phi node is constant
1.1  mrg    * the value of the phi node in the next iteration can be derived from the
1.1  mrg      value in the current iteration by a chain of operations with constants,
1.1  mrg      or is also a constant
1.1  mrg
1.1  mrg    If such phi node exists, it is returned, otherwise NULL is returned.
1.1  mrg    NULL is also returned if X itself is an invariant.  */
1.1  mrg
1.1  mrg static gphi *
1.1  mrg get_base_for (class loop *loop, tree x)
1.1  mrg {
1.1  mrg   if (is_gimple_min_invariant (x))
1.1  mrg     return NULL;
1.1  mrg
1.1  mrg   gphi *header_phi = chain_of_csts_start (loop, x);
1.1  mrg   if (!header_phi)
1.1  mrg     return NULL;
1.1  mrg
1.1  mrg   tree init_val = PHI_ARG_DEF_FROM_EDGE (header_phi,
1.1  mrg 					 loop_preheader_edge (loop));
1.1  mrg   tree next_val = PHI_ARG_DEF_FROM_EDGE (header_phi, loop_latch_edge (loop));
1.1  mrg
1.1  mrg   /* The value on entry to the loop has to be a constant.  */
1.1  mrg   if (!is_gimple_min_invariant (init_val))
1.1  mrg     return NULL;
1.1  mrg
1.1  mrg   /* The value coming from the latch is accepted if it is not an SSA name,
1.1  mrg      or if its chain of definitions leads back to the very same phi.  */
1.1  mrg   if (TREE_CODE (next_val) != SSA_NAME)
1.1  mrg     return header_phi;
1.1  mrg
1.1  mrg   if (chain_of_csts_start (loop, next_val) != header_phi)
1.1  mrg     return NULL;
1.1  mrg
1.1  mrg   return header_phi;
1.1  mrg }
1.1  mrg
1.1  mrg /* Given an expression X, then
1.1  mrg
1.1  mrg    * if X is NULL_TREE, we return the constant BASE.
1.1  mrg    * if X is a constant, we return the constant X.
1.1  mrg    * otherwise X is a SSA name, whose value in the considered loop is derived
1.1  mrg      by a chain of operations with constant from a result of a phi node in
1.1  mrg      the header of the loop.  Then we return value of X when the value of the
1.1  mrg      result of this phi node is given by the constant BASE.  */
1.1  mrg
1.1  mrg static tree
1.1  mrg get_val_for (tree x, tree base)
1.1  mrg {
1.1  mrg   gcc_checking_assert (is_gimple_min_invariant (base));
1.1  mrg
1.1  mrg   if (!x)
1.1  mrg     return base;
1.1  mrg   if (is_gimple_min_invariant (x))
1.1  mrg     return x;
1.1  mrg
1.1  mrg   /* Reaching a phi node means the start of the chain, whose value is
1.1  mrg      BASE.  */
1.1  mrg   gimple *def = SSA_NAME_DEF_STMT (x);
1.1  mrg   if (gimple_code (def) == GIMPLE_PHI)
1.1  mrg     return base;
1.1  mrg
1.1  mrg   gcc_checking_assert (is_gimple_assign (def));
1.1  mrg
1.1  mrg   /* DEF must be either an assignment of a single SSA name or an
1.1  mrg      expression involving an SSA name and a constant.  Try to fold that
1.1  mrg      expression using the value for the SSA name.  */
1.1  mrg   if (gimple_assign_ssa_name_copy_p (def))
1.1  mrg     return get_val_for (gimple_assign_rhs1 (def), base);
1.1  mrg
1.1  mrg   const enum tree_code rhs_code = gimple_assign_rhs_code (def);
1.1  mrg   const enum gimple_rhs_class rhs_class = gimple_assign_rhs_class (def);
1.1  mrg   tree result_type = TREE_TYPE (gimple_assign_lhs (def));
1.1  mrg   tree arg0 = gimple_assign_rhs1 (def);
1.1  mrg
1.1  mrg   if (rhs_class == GIMPLE_UNARY_RHS && TREE_CODE (arg0) == SSA_NAME)
1.1  mrg     return fold_build1 (rhs_code, result_type, get_val_for (arg0, base));
1.1  mrg
1.1  mrg   if (rhs_class != GIMPLE_BINARY_RHS)
1.1  mrg     gcc_unreachable ();
1.1  mrg
1.1  mrg   /* Binary operation: substitute the value for whichever operand is the
1.1  mrg      SSA name, the first operand being checked first.  */
1.1  mrg   tree arg1 = gimple_assign_rhs2 (def);
1.1  mrg   if (TREE_CODE (arg0) == SSA_NAME)
1.1  mrg     arg0 = get_val_for (arg0, base);
1.1  mrg   else if (TREE_CODE (arg1) == SSA_NAME)
1.1  mrg     arg1 = get_val_for (arg1, base);
1.1  mrg   else
1.1  mrg     gcc_unreachable ();
1.1  mrg
1.1  mrg   return fold_build2 (rhs_code, result_type, arg0, arg1);
1.1  mrg }
1.1  mrg
1.1  mrg
1.1  mrg /* Tries to count the number of iterations of LOOP till it exits by EXIT
1.1  mrg    by brute force -- i.e. by determining the value of the operands of the
1.1  mrg    condition at EXIT in first few iterations of the loop (assuming that
1.1  mrg    these values are constant) and determining the first one in that the
1.1  mrg    condition is not satisfied.  Returns the constant giving the number
1.1  mrg    of the iterations of LOOP if successful, chrec_dont_know otherwise.
1.1  mrg    At most MAX_ITERATIONS_TO_TRACK iterations are evaluated.  */
1.1  mrg
1.1  mrg tree
1.1  mrg loop_niter_by_eval (class loop *loop, edge exit)
1.1  mrg {
1.1  mrg   tree acnd;
1.1  mrg   tree op[2], val[2], next[2], aval[2];
1.1  mrg   gphi *phi;
1.1  mrg   gimple *cond;
1.1  mrg   unsigned i, j;
1.1  mrg   enum tree_code cmp;
1.1  mrg
1.1  mrg   /* Only an exit controlled by a condition statement can be evaluated.  */
1.1  mrg   cond = last_stmt (exit->src);
1.1  mrg   if (!cond || gimple_code (cond) != GIMPLE_COND)
1.1  mrg     return chrec_dont_know;
1.1  mrg
1.1  mrg   /* We want the condition for staying inside the loop.  */
1.1  mrg   cmp = gimple_cond_code (cond);
1.1  mrg   if (exit->flags & EDGE_TRUE_VALUE)
1.1  mrg     cmp = invert_tree_comparison (cmp, false);
1.1  mrg
1.1  mrg   switch (cmp)
1.1  mrg     {
1.1  mrg     case EQ_EXPR:
1.1  mrg     case NE_EXPR:
1.1  mrg     case GT_EXPR:
1.1  mrg     case GE_EXPR:
1.1  mrg     case LT_EXPR:
1.1  mrg     case LE_EXPR:
1.1  mrg       op[0] = gimple_cond_lhs (cond);
1.1  mrg       op[1] = gimple_cond_rhs (cond);
1.1  mrg       break;
1.1  mrg
1.1  mrg     default:
1.1  mrg       return chrec_dont_know;
1.1  mrg     }
1.1  mrg
1.1  mrg   /* For each operand, VAL is the current value of its base (the operand
1.1  mrg      itself if it is invariant, otherwise the initial value of the header
1.1  mrg      phi node it is derived from) and NEXT is the name from which the base
1.1  mrg      of the following iteration is computed.  */
1.1  mrg   for (j = 0; j < 2; j++)
1.1  mrg     {
1.1  mrg       if (is_gimple_min_invariant (op[j]))
1.1  mrg 	{
1.1  mrg 	  val[j] = op[j];
1.1  mrg 	  next[j] = NULL_TREE;
1.1  mrg 	  op[j] = NULL_TREE;
1.1  mrg 	}
1.1  mrg       else
1.1  mrg 	{
1.1  mrg 	  phi = get_base_for (loop, op[j]);
1.1  mrg 	  if (!phi)
1.1  mrg 	    return chrec_dont_know;
1.1  mrg 	  val[j] = PHI_ARG_DEF_FROM_EDGE (phi, loop_preheader_edge (loop));
1.1  mrg 	  next[j] = PHI_ARG_DEF_FROM_EDGE (phi, loop_latch_edge (loop));
1.1  mrg 	}
1.1  mrg     }
1.1  mrg
1.1  mrg   /* Don't issue signed overflow warnings.  */
1.1  mrg   fold_defer_overflow_warnings ();
1.1  mrg
1.1  mrg   for (i = 0; i < MAX_ITERATIONS_TO_TRACK; i++)
1.1  mrg     {
1.1  mrg       /* Values of the operands of the condition in iteration I.  */
1.1  mrg       for (j = 0; j < 2; j++)
1.1  mrg 	aval[j] = get_val_for (op[j], val[j]);
1.1  mrg
1.1  mrg       acnd = fold_binary (cmp, boolean_type_node, aval[0], aval[1]);
1.1  mrg       if (acnd && integer_zerop (acnd))
1.1  mrg 	{
1.1  mrg 	  fold_undefer_and_ignore_overflow_warnings ();
1.1  mrg 	  /* I is unsigned, so it is printed with %u.  */
1.1  mrg 	  if (dump_file && (dump_flags & TDF_DETAILS))
1.1  mrg 	    fprintf (dump_file,
1.1  mrg 		     "Proved that loop %d iterates %u times using brute force.\n",
1.1  mrg 		     loop->num, i);
1.1  mrg 	  return build_int_cst (unsigned_type_node, i);
1.1  mrg 	}
1.1  mrg
1.1  mrg       /* Advance the bases to the next iteration, remembering the current
1.1  mrg 	 ones in AVAL for the comparison below.  */
1.1  mrg       for (j = 0; j < 2; j++)
1.1  mrg 	{
1.1  mrg 	  aval[j] = val[j];
1.1  mrg 	  val[j] = get_val_for (next[j], val[j]);
1.1  mrg 	  if (!is_gimple_min_invariant (val[j]))
1.1  mrg 	    {
1.1  mrg 	      fold_undefer_and_ignore_overflow_warnings ();
1.1  mrg 	      return chrec_dont_know;
1.1  mrg 	    }
1.1  mrg 	}
1.1  mrg
1.1  mrg       /* If the next iteration would use the same base values
1.1  mrg 	 as the current one, there is no point looping further,
1.1  mrg 	 all following iterations will be the same as this one.  */
1.1  mrg       if (val[0] == aval[0] && val[1] == aval[1])
1.1  mrg 	break;
1.1  mrg     }
1.1  mrg
1.1  mrg   fold_undefer_and_ignore_overflow_warnings ();
1.1  mrg
1.1  mrg   return chrec_dont_know;
1.1  mrg }
1.1  mrg
1.1  mrg /* Finds the exit of the LOOP by that the loop exits after a constant
1.1  mrg    number of iterations and stores the exit edge to *EXIT.  The constant
1.1  mrg    giving the number of iterations of LOOP is returned.  The number of
1.1  mrg    iterations is determined using loop_niter_by_eval (i.e. by brute force
1.1  mrg    evaluation).  Among several such exits, one with the lowest number of
1.1  mrg    iterations is chosen.  If we are unable to find the exit for that
1.1  mrg    loop_niter_by_eval determines the number of iterations, chrec_dont_know
1.1  mrg    is returned and *EXIT is NULL.  */
1.1  mrg
1.1  mrg tree
1.1  mrg find_loop_niter_by_eval (class loop *loop, edge *exit)
1.1  mrg {
1.1  mrg   auto_vec<edge> exits = get_loop_exit_edges (loop);
1.1  mrg   tree best = NULL_TREE;
1.1  mrg   edge ex;
1.1  mrg   unsigned ix;
1.1  mrg
1.1  mrg   *exit = NULL;
1.1  mrg
1.1  mrg   /* Loops with multiple exits are expensive to handle and less important.  */
1.1  mrg   if (exits.length () > 1
1.1  mrg       && !flag_expensive_optimizations)
1.1  mrg     return chrec_dont_know;
1.1  mrg
1.1  mrg   FOR_EACH_VEC_ELT (exits, ix, ex)
1.1  mrg     {
1.1  mrg       if (!just_once_each_iteration_p (loop, ex->src))
1.1  mrg 	continue;
1.1  mrg
1.1  mrg       tree cand = loop_niter_by_eval (loop, ex);
1.1  mrg       if (chrec_contains_undetermined (cand))
1.1  mrg 	continue;
1.1  mrg
1.1  mrg       /* Keep the first result, or a strictly lower later one.  */
1.1  mrg       if (!best || tree_int_cst_lt (cand, best))
1.1  mrg 	{
1.1  mrg 	  best = cand;
1.1  mrg 	  *exit = ex;
1.1  mrg 	}
1.1  mrg     }
1.1  mrg
1.1  mrg   return best ? best : chrec_dont_know;
1.1  mrg }
1.1  mrg
1.1  mrg /*
1.1  mrg
1.1  mrg    Analysis of upper bounds on number of iterations of a loop.
1.1  mrg
1.1  mrg */
1.1  mrg
1.1  mrg static widest_int derive_constant_upper_bound_ops (tree, tree,
1.1  mrg 						   enum tree_code, tree);
1.1  mrg
1.1  mrg /* Returns a constant upper bound on the value of the right-hand side of
1.1  mrg    an assignment statement STMT.  The bound is derived from the code and
1.1  mrg    the first two operands of the right-hand side, in the type of the
1.1  mrg    left-hand side.  */
1.1  mrg
1.1  mrg static widest_int
1.1  mrg derive_constant_upper_bound_assign (gimple *stmt)
1.1  mrg {
1.1  mrg   tree lhs_type = TREE_TYPE (gimple_assign_lhs (stmt));
1.1  mrg
1.1  mrg   return derive_constant_upper_bound_ops (lhs_type,
1.1  mrg 					  gimple_assign_rhs1 (stmt),
1.1  mrg 					  gimple_assign_rhs_code (stmt),
1.1  mrg 					  gimple_assign_rhs2 (stmt));
1.1  mrg }
1.1  mrg
1.1  mrg /* Returns a constant upper bound on the value of expression VAL.  VAL
1.1  mrg    is considered to be unsigned.  If its type is signed, its value must
1.1  mrg    be nonnegative.  */
1.1  mrg
1.1  mrg static widest_int
1.1  mrg derive_constant_upper_bound (tree val)
1.1  mrg {
1.1  mrg   enum tree_code val_code;
1.1  mrg   tree operand0, operand1, operand2;
1.1  mrg
1.1  mrg   /* Split VAL into its code and operands; the third operand is extracted
1.1  mrg      but not used for the bound.  */
1.1  mrg   extract_ops_from_tree (val, &val_code, &operand0, &operand1, &operand2);
1.1  mrg
1.1  mrg   tree val_type = TREE_TYPE (val);
1.1  mrg   return derive_constant_upper_bound_ops (val_type, operand0, val_code,
1.1  mrg 					  operand1);
1.1  mrg }
1.1  mrg
1.1  mrg /* Returns a constant upper bound on the value of expression OP0 CODE OP1,
1.1  mrg    whose type is TYPE.  The expression is considered to be unsigned.  If
1.1  mrg    its type is signed, its value must be nonnegative.
1.1  mrg
1.1  mrg    The fallback answer is the maximum value of TYPE (TYPE_MAX_VALUE for
1.1  mrg    integral types, upper_bound_in_type otherwise); it is returned for every
1.1  mrg    CODE not handled below and whenever a handled case cannot establish
1.1  mrg    anything tighter.  The handled codes are INTEGER_CST, conversions,
1.1  mrg    PLUS_EXPR, POINTER_PLUS_EXPR and MINUS_EXPR with an INTEGER_CST second
1.1  mrg    operand, FLOOR_DIV_EXPR and EXACT_DIV_EXPR by an INTEGER_CST whose sign
1.1  mrg    bit is clear, BIT_AND_EXPR with an INTEGER_CST whose sign bit is clear,
1.1  mrg    and SSA_NAMEs defined by a GIMPLE_ASSIGN (which are handed to
1.1  mrg    derive_constant_upper_bound_assign).  */
1.1  mrg
1.1  mrg static widest_int
1.1  mrg derive_constant_upper_bound_ops (tree type, tree op0,
1.1  mrg 				 enum tree_code code, tree op1)
1.1  mrg {
1.1  mrg   tree subtype, maxt;
1.1  mrg   widest_int bnd, max, cst;
1.1  mrg   gimple *stmt;
1.1  mrg
1.1  mrg   if (INTEGRAL_TYPE_P (type))
1.1  mrg     maxt = TYPE_MAX_VALUE (type);
1.1  mrg   else
1.1  mrg     maxt = upper_bound_in_type (type, type);
1.1  mrg
1.1  mrg   max = wi::to_widest (maxt);
1.1  mrg
1.1  mrg   switch (code)
1.1  mrg     {
1.1  mrg     case INTEGER_CST:
1.1  mrg       return wi::to_widest (op0);
1.1  mrg
1.1  mrg     CASE_CONVERT:
1.1  mrg       subtype = TREE_TYPE (op0);
1.1  mrg       if (!TYPE_UNSIGNED (subtype)
1.1  mrg 	  /* If TYPE is also signed, the fact that VAL is nonnegative implies
1.1  mrg 	     that OP0 is nonnegative.  */
1.1  mrg 	  && TYPE_UNSIGNED (type)
1.1  mrg 	  && !tree_expr_nonnegative_p (op0))
1.1  mrg 	{
1.1  mrg 	  /* If we cannot prove that the casted expression is nonnegative,
1.1  mrg 	     we cannot establish more useful upper bound than the precision
1.1  mrg 	     of the type gives us.  */
1.1  mrg 	  return max;
1.1  mrg 	}
1.1  mrg
1.1  mrg       /* We now know that op0 is a nonnegative value.  Try deriving an upper
1.1  mrg 	 bound for it.  */
1.1  mrg       bnd = derive_constant_upper_bound (op0);
1.1  mrg
1.1  mrg       /* If the bound does not fit in TYPE, max. value of TYPE could be
1.1  mrg 	 attained.  */
1.1  mrg       if (wi::ltu_p (max, bnd))
1.1  mrg 	return max;
1.1  mrg
1.1  mrg       return bnd;
1.1  mrg
1.1  mrg     case PLUS_EXPR:
1.1  mrg     case POINTER_PLUS_EXPR:
1.1  mrg     case MINUS_EXPR:
1.1  mrg       if (TREE_CODE (op1) != INTEGER_CST
1.1  mrg 	  || !tree_expr_nonnegative_p (op0))
1.1  mrg 	return max;
1.1  mrg
1.1  mrg       /* Canonicalize to OP0 - CST.  Consider CST to be signed, in order to
1.1  mrg 	 choose the most logical way how to treat this constant regardless
1.1  mrg 	 of the signedness of the type.  The constant is sign-extended from
1.1  mrg 	 the precision of TYPE and negated for the two addition codes.  */
1.1  mrg       cst = wi::sext (wi::to_widest (op1), TYPE_PRECISION (type));
1.1  mrg       if (code != MINUS_EXPR)
1.1  mrg 	cst = -cst;
1.1  mrg
1.1  mrg       bnd = derive_constant_upper_bound (op0);
1.1  mrg
1.1  mrg       if (wi::neg_p (cst))
1.1  mrg 	{
1.1  mrg 	  cst = -cst;
1.1  mrg 	  /* Avoid CST == 0x80000...  */
1.1  mrg 	  if (wi::neg_p (cst))
1.1  mrg 	    return max;
1.1  mrg
1.1  mrg 	  /* OP0 + CST.  We need to check that
1.1  mrg 	     BND <= MAX (type) - CST.
1.1  mrg
1.1  mrg 	     NOTE(review): as written, MAX is returned when
1.1  mrg 	     BND <= MAX - CST holds and BND + CST is returned otherwise,
1.1  mrg 	     which reads like the opposite of what the sentence above asks
1.1  mrg 	     for.  Both results still appear to be upper bounds, so this
1.1  mrg 	     seems to cost only precision; confirm before changing.  */
1.1  mrg
1.1  mrg 	  widest_int mmax = max - cst;
1.1  mrg 	  if (wi::leu_p (bnd, mmax))
1.1  mrg 	    return max;
1.1  mrg
1.1  mrg 	  return bnd + cst;
1.1  mrg 	}
1.1  mrg       else
1.1  mrg 	{
1.1  mrg 	  /* OP0 - CST, where CST >= 0.
1.1  mrg
1.1  mrg 	     If TYPE is signed, we have already verified that OP0 >= 0, and we
1.1  mrg 	     know that the result is nonnegative.  This implies that
1.1  mrg 	     VAL <= BND - CST.
1.1  mrg
1.1  mrg 	     If TYPE is unsigned, we must additionally know that OP0 >= CST,
1.1  mrg 	     otherwise the operation underflows.
1.1  mrg
1.1  mrg 	     NOTE(review): the unsigned check below gives up (returns MAX)
1.1  mrg 	     when folding OP0 >= CST fails or yields a nonzero constant, and
1.1  mrg 	     continues to BND - CST in the remaining cases.  That looks
1.1  mrg 	     inverted relative to the requirement just stated; confirm
1.1  mrg 	     before relying on it.
1.1  mrg 	   */
1.1  mrg
1.1  mrg 	  /* This should only happen if the type is unsigned; however, for
1.1  mrg 	     buggy programs that use overflowing signed arithmetic even with
1.1  mrg 	     -fno-wrapv, this condition may also be true for signed values.  */
1.1  mrg 	  if (wi::ltu_p (bnd, cst))
1.1  mrg 	    return max;
1.1  mrg
1.1  mrg 	  if (TYPE_UNSIGNED (type))
1.1  mrg 	    {
1.1  mrg 	      tree tem = fold_binary (GE_EXPR, boolean_type_node, op0,
1.1  mrg 				      wide_int_to_tree (type, cst));
1.1  mrg 	      if (!tem || integer_nonzerop (tem))
1.1  mrg 		return max;
1.1  mrg 	    }
1.1  mrg
1.1  mrg 	  bnd -= cst;
1.1  mrg 	}
1.1  mrg
1.1  mrg       return bnd;
1.1  mrg
1.1  mrg     case FLOOR_DIV_EXPR:
1.1  mrg     case EXACT_DIV_EXPR:
1.1  mrg       if (TREE_CODE (op1) != INTEGER_CST
1.1  mrg 	  || tree_int_cst_sign_bit (op1))
1.1  mrg 	return max;
1.1  mrg
1.1  mrg       bnd = derive_constant_upper_bound (op0);
1.1  mrg       return wi::udiv_floor (bnd, wi::to_widest (op1));
1.1  mrg
1.1  mrg     case BIT_AND_EXPR:
1.1  mrg       if (TREE_CODE (op1) != INTEGER_CST
1.1  mrg 	  || tree_int_cst_sign_bit (op1))
1.1  mrg 	return max;
1.1  mrg       return wi::to_widest (op1);
1.1  mrg
1.1  mrg     case SSA_NAME:
1.1  mrg       stmt = SSA_NAME_DEF_STMT (op0);
1.1  mrg       if (gimple_code (stmt) != GIMPLE_ASSIGN
1.1  mrg 	  || gimple_assign_lhs (stmt) != op0)
1.1  mrg 	return max;
1.1  mrg       return derive_constant_upper_bound_assign (stmt);
1.1  mrg
1.1  mrg     default:
1.1  mrg       return max;
1.1  mrg     }
1.1  mrg }
1.1  mrg
1.1  mrg /* Issue the -Waggressive-loop-optimizations diagnostic for LOOP when
1.1  mrg    undefined behavior in STMT limits the iteration count to I_BOUND and
1.1  mrg    that is below the constant iteration count already recorded for the
1.1  mrg    loop.  A loop is marked once it has been diagnosed so that it is not
1.1  mrg    reported again.  */
1.1  mrg
1.1  mrg static void
1.1  mrg do_warn_aggressive_loop_optimizations (class loop *loop,
1.1  mrg 				       widest_int i_bound, gimple *stmt)
1.1  mrg {
1.1  mrg   tree niter = loop->nb_iterations;
1.1  mrg
1.1  mrg   /* Without a known constant iteration count there is nothing to compare
1.1  mrg      I_BOUND against.  */
1.1  mrg   if (!niter || TREE_CODE (niter) != INTEGER_CST)
1.1  mrg     return;
1.1  mrg
1.1  mrg   /* The warning has to be enabled.  */
1.1  mrg   if (!warn_aggressive_loop_optimizations)
1.1  mrg     return;
1.1  mrg
1.1  mrg   /* To avoid warning multiple times for the same loop, only start warning
1.1  mrg      when we preserve loops.  */
1.1  mrg   if ((cfun->curr_properties & PROP_loops) == 0)
1.1  mrg     return;
1.1  mrg
1.1  mrg   /* This loop was reported before.  */
1.1  mrg   if (loop->warned_aggressive_loop_optimizations)
1.1  mrg     return;
1.1  mrg
1.1  mrg   /* The undefined behavior must give a lower estimate than the known
1.1  mrg      constant bound.  */
1.1  mrg   if (wi::cmpu (i_bound, wi::to_widest (niter)) >= 0)
1.1  mrg     return;
1.1  mrg
1.1  mrg   /* The undefined behavior must happen unconditionally.  */
1.1  mrg   if (!dominated_by_p (CDI_DOMINATORS, loop->latch, gimple_bb (stmt)))
1.1  mrg     return;
1.1  mrg
1.1  mrg   /* The note that accompanies the warning points at the last statement of
1.1  mrg      the source block of the loop's single exit.  */
1.1  mrg   edge exit_edge = single_exit (loop);
1.1  mrg   if (!exit_edge)
1.1  mrg     return;
1.1  mrg   gimple *exit_stmt = last_stmt (exit_edge->src);
1.1  mrg
1.1  mrg   /* Print I_BOUND with the signedness of the iteration count's type.  */
1.1  mrg   char buf[WIDE_INT_PRINT_BUFFER_SIZE];
1.1  mrg   print_dec (i_bound, buf,
1.1  mrg 	     TYPE_UNSIGNED (TREE_TYPE (niter)) ? UNSIGNED : SIGNED);
1.1  mrg
1.1  mrg   auto_diagnostic_group d;
1.1  mrg   if (warning_at (gimple_location (stmt), OPT_Waggressive_loop_optimizations,
1.1  mrg 		  "iteration %s invokes undefined behavior", buf))
1.1  mrg     inform (gimple_location (exit_stmt), "within this loop");
1.1  mrg   loop->warned_aggressive_loop_optimizations = true;
1.1  mrg }
1.1  mrg
1.1  mrg /* Note in LOOP that AT_STMT runs no more than BOUND + 1 times.  IS_EXIT
1.1  mrg    says that the loop is left right after AT_STMT, at the latest once
1.1  mrg    AT_STMT has run BOUND + 1 times.  REALISTIC says that BOUND is expected
1.1  mrg    to be near the real iteration count, UPPER says that the loop certainly
1.1  mrg    iterates at most BOUND times, and I_BOUND is a widest_int upper estimate
1.1  mrg    of BOUND.  */
1.1  mrg
1.1  mrg static void
1.1  mrg record_estimate (class loop *loop, tree bound, const widest_int &i_bound,
1.1  mrg 		 gimple *at_stmt, bool is_exit, bool realistic, bool upper)
1.1  mrg {
1.1  mrg   if (dump_file && (dump_flags & TDF_DETAILS))
1.1  mrg     {
1.1  mrg       const char *exit_tag = is_exit ? "(exit)" : "";
1.1  mrg       const char *certainty = upper ? "" : "probably ";
1.1  mrg
1.1  mrg       fprintf (dump_file, "Statement %s", exit_tag);
1.1  mrg       print_gimple_stmt (dump_file, at_stmt, 0, TDF_SLIM);
1.1  mrg       fprintf (dump_file, " is %sexecuted at most ", certainty);
1.1  mrg       print_generic_expr (dump_file, bound, TDF_SLIM);
1.1  mrg       fprintf (dump_file, " (bounded by ");
1.1  mrg       print_decu (i_bound, dump_file);
1.1  mrg       fprintf (dump_file, ") + 1 times in loop %d.\n", loop->num);
1.1  mrg     }
1.1  mrg
1.1  mrg   /* A constant BOUND has to agree with I_BOUND.  For any other BOUND,
1.1  mrg      I_BOUND is just an estimate and rarely close to the real number of
1.1  mrg      iterations.  */
1.1  mrg   if (TREE_CODE (bound) == INTEGER_CST)
1.1  mrg     gcc_checking_assert (i_bound == wi::to_widest (bound));
1.1  mrg   else
1.1  mrg     realistic = false;
1.1  mrg
1.1  mrg   /* Guaranteed bounds go onto LOOP's list, with one exception: a non-exit
1.1  mrg      bound (i.e. undefined behavior in AT_STMT) in a loop whose number of
1.1  mrg      iterations is already a known constant.  */
1.1  mrg   const bool niter_is_cst
1.1  mrg     = (loop->nb_iterations != NULL_TREE
1.1  mrg        && TREE_CODE (loop->nb_iterations) == INTEGER_CST);
1.1  mrg   if (upper && (is_exit || !niter_is_cst))
1.1  mrg     {
1.1  mrg       class nb_iter_bound *entry = ggc_alloc<nb_iter_bound> ();
1.1  mrg
1.1  mrg       entry->bound = i_bound;
1.1  mrg       entry->stmt = at_stmt;
1.1  mrg       entry->is_exit = is_exit;
1.1  mrg       entry->next = loop->bounds;
1.1  mrg       loop->bounds = entry;
1.1  mrg     }
1.1  mrg
1.1  mrg   /* Only a statement that is executed on every path to the loop latch
1.1  mrg      bounds the number of iterations of the loop directly.  */
1.1  mrg   if (!dominated_by_p (CDI_DOMINATORS, loop->latch, gimple_bb (at_stmt)))
1.1  mrg     upper = false;
1.1  mrg
1.1  mrg   /* Translate the bound on AT_STMT into a bound on the latch: an exit lets
1.1  mrg      the latch run at most BOUND times, any other statement BOUND + 1
1.1  mrg      times.  The estimate is lowered later if such a statement must be
1.1  mrg      executed on the last iteration.  */
1.1  mrg   widest_int delta (is_exit ? 0 : 1);
1.1  mrg   widest_int new_i_bound = i_bound + delta;
1.1  mrg
1.1  mrg   /* If an overflow occurred, ignore the result.  */
1.1  mrg   if (wi::ltu_p (new_i_bound, delta))
1.1  mrg     return;
1.1  mrg
1.1  mrg   if (upper && !is_exit)
1.1  mrg     do_warn_aggressive_loop_optimizations (loop, new_i_bound, at_stmt);
1.1  mrg   record_niter_bound (loop, new_i_bound, realistic, upper);
1.1  mrg }
1.1  mrg
1.1  mrg /* Prepend the control induction variable described by NITER to the list
1.1  mrg    LOOP->control_ivs.  Nothing is recorded unless the variable has both a
1.1  mrg    base and a step, the assumptions of NITER are the constant one, and the
1.1  mrg    variable is known not to overflow.  */
1.1  mrg
1.1  mrg static void
1.1  mrg record_control_iv (class loop *loop, class tree_niter_desc *niter)
1.1  mrg {
1.1  mrg   tree iv_base = niter->control.base;
1.1  mrg   tree iv_step = niter->control.step;
1.1  mrg
1.1  mrg   /* An incomplete description is of no use.  */
1.1  mrg   if (iv_base == NULL_TREE || iv_step == NULL_TREE)
1.1  mrg     return;
1.1  mrg
1.1  mrg   /* The description must hold unconditionally and without overflow.  */
1.1  mrg   if (!(integer_onep (niter->assumptions) && niter->control.no_overflow))
1.1  mrg     return;
1.1  mrg
1.1  mrg   struct control_iv *entry = ggc_alloc<control_iv> ();
1.1  mrg   entry->base = iv_base;
1.1  mrg   entry->step = iv_step;
1.1  mrg   entry->next = loop->control_ivs;
1.1  mrg   loop->control_ivs = entry;
1.1  mrg }
1.1  mrg
1.1  mrg /* Return true, and store the base of the induction variable in *INIT,
1.1  mrg    when all of the following hold:
1.1  mrg      1) VAR is an SSA_NAME whose defining statement lies in a loop.
1.1  mrg      2) simple_iv recognizes VAR as an IV:{base, step} in that loop.
1.1  mrg      3) The IV is known not to overflow.
1.1  mrg      4) Both base and step are INTEGER_CSTs.
1.1  mrg      5) The direction matches IS_MIN: with IS_MIN set the sign bit of the
1.1  mrg 	step must be clear, otherwise it must be set.
1.1  mrg    In every other case return false and leave *INIT alone.  */
1.1  mrg
1.1  mrg static bool
1.1  mrg get_cst_init_from_scev (tree var, wide_int *init, bool is_min)
1.1  mrg {
1.1  mrg   if (TREE_CODE (var) != SSA_NAME)
1.1  mrg     return false;
1.1  mrg
1.1  mrg   class loop *def_loop = loop_containing_stmt (SSA_NAME_DEF_STMT (var));
1.1  mrg   if (!def_loop)
1.1  mrg     return false;
1.1  mrg
1.1  mrg   /* VAR has to be a simple, non-overflowing IV of its own loop.  */
1.1  mrg   affine_iv iv;
1.1  mrg   if (!simple_iv (def_loop, def_loop, var, &iv, false) || !iv.no_overflow)
1.1  mrg     return false;
1.1  mrg
1.1  mrg   const bool base_is_cst = TREE_CODE (iv.base) == INTEGER_CST;
1.1  mrg   const bool step_is_cst = TREE_CODE (iv.step) == INTEGER_CST;
1.1  mrg   if (!base_is_cst || !step_is_cst)
1.1  mrg     return false;
1.1  mrg
1.1  mrg   /* Reject a step whose direction does not fit the requested extreme.  */
1.1  mrg   if (tree_int_cst_sign_bit (iv.step) == is_min)
1.1  mrg     return false;
1.1  mrg
1.1  mrg   *init = wi::to_wide (iv.base);
1.1  mrg   return true;
1.1  mrg }
1.1  mrg
1.1  mrg /* Record the estimate on number of iterations of LOOP based on the fact that
1.1  mrg    the induction variable BASE + STEP * i evaluated in STMT does not wrap and
1.1  mrg    its values belong to the range <LOW, HIGH>.  REALISTIC is true if the
1.1  mrg    estimated number of iterations is expected to be close to the real one.
1.1  mrg    UPPER is true if we are sure the induction variable does not wrap.
1.1  mrg
1.1  mrg    Nothing is recorded unless STEP is a nonzero INTEGER_CST.  The computation
1.1  mrg    is done in the unsigned variant of the type of BASE.  For a STEP with the
1.1  mrg    sign bit set the variable runs from BASE down to LOW, otherwise from BASE
1.1  mrg    up to HIGH.  In either direction the starting point may be replaced: by a
1.1  mrg    constant taken from the range query or from get_cst_init_from_scev when
1.1  mrg    BASE is an SSA_NAME of integral type and that constant is tighter than
1.1  mrg    the opposite end of the range (HIGH resp. LOW); or else, when BASE is not
1.1  mrg    constant and the block of STMT dominates the latch of LOOP, by that end
1.1  mrg    of the range itself.  The bound handed to record_estimate is the distance
1.1  mrg    between the starting point and the extreme divided by the magnitude of
1.1  mrg    STEP, together with a constant upper bound derived from it.  */
1.1  mrg
1.1  mrg static void
1.1  mrg record_nonwrapping_iv (class loop *loop, tree base, tree step, gimple *stmt,
1.1  mrg 		       tree low, tree high, bool realistic, bool upper)
1.1  mrg {
1.1  mrg   tree niter_bound, extreme, delta;
1.1  mrg   tree type = TREE_TYPE (base), unsigned_type;
1.1  mrg   tree orig_base = base;
1.1  mrg
1.1  mrg   if (TREE_CODE (step) != INTEGER_CST || integer_zerop (step))
1.1  mrg     return;
1.1  mrg
1.1  mrg   if (dump_file && (dump_flags & TDF_DETAILS))
1.1  mrg     {
1.1  mrg       fprintf (dump_file, "Induction variable (");
1.1  mrg       print_generic_expr (dump_file, TREE_TYPE (base), TDF_SLIM);
1.1  mrg       fprintf (dump_file, ") ");
1.1  mrg       print_generic_expr (dump_file, base, TDF_SLIM);
1.1  mrg       fprintf (dump_file, " + ");
1.1  mrg       print_generic_expr (dump_file, step, TDF_SLIM);
1.1  mrg       fprintf (dump_file, " * iteration does not wrap in statement ");
1.1  mrg       print_gimple_stmt (dump_file, stmt, 0, TDF_SLIM);
1.1  mrg       fprintf (dump_file, " in loop %d.\n", loop->num);
1.1  mrg     }
1.1  mrg
1.1  mrg   unsigned_type = unsigned_type_for (type);
1.1  mrg   base = fold_convert (unsigned_type, base);
1.1  mrg   step = fold_convert (unsigned_type, step);
1.1  mrg
1.1  mrg   if (tree_int_cst_sign_bit (step))
1.1  mrg     {
1.1  mrg       wide_int max;
1.1  mrg       value_range base_range;
1.1  mrg       if (get_range_query (cfun)->range_of_expr (base_range, orig_base)
1.1  mrg 	  && !base_range.undefined_p ())
1.1  mrg 	max = base_range.upper_bound ();
1.1  mrg       extreme = fold_convert (unsigned_type, low);
1.1  mrg       if (TREE_CODE (orig_base) == SSA_NAME
1.1  mrg 	  && TREE_CODE (high) == INTEGER_CST
1.1  mrg 	  && INTEGRAL_TYPE_P (TREE_TYPE (orig_base))
1.1  mrg 	  && (base_range.kind () == VR_RANGE
1.1  mrg 	      || get_cst_init_from_scev (orig_base, &max, false))
1.1  mrg 	  && wi::gts_p (wi::to_wide (high), max))
1.1  mrg 	base = wide_int_to_tree (unsigned_type, max);
1.1  mrg       else if (TREE_CODE (base) != INTEGER_CST
1.1  mrg 	       && dominated_by_p (CDI_DOMINATORS,
1.1  mrg 				  loop->latch, gimple_bb (stmt)))
1.1  mrg 	base = fold_convert (unsigned_type, high);
1.1  mrg       delta = fold_build2 (MINUS_EXPR, unsigned_type, base, extreme);
1.1  mrg       step = fold_build1 (NEGATE_EXPR, unsigned_type, step);
1.1  mrg     }
1.1  mrg   else
1.1  mrg     {
1.1  mrg       wide_int min;
1.1  mrg       value_range base_range;
1.1  mrg       if (get_range_query (cfun)->range_of_expr (base_range, orig_base)
1.1  mrg 	  && !base_range.undefined_p ())
1.1  mrg 	min = base_range.lower_bound ();
1.1  mrg       extreme = fold_convert (unsigned_type, high);
1.1  mrg       if (TREE_CODE (orig_base) == SSA_NAME
1.1  mrg 	  && TREE_CODE (low) == INTEGER_CST
1.1  mrg 	  && INTEGRAL_TYPE_P (TREE_TYPE (orig_base))
1.1  mrg 	  && (base_range.kind () == VR_RANGE
1.1  mrg 	      || get_cst_init_from_scev (orig_base, &min, true))
1.1  mrg 	  && wi::gts_p (min, wi::to_wide (low)))
1.1  mrg 	base = wide_int_to_tree (unsigned_type, min);
1.1  mrg       else if (TREE_CODE (base) != INTEGER_CST
1.1  mrg 	       && dominated_by_p (CDI_DOMINATORS,
1.1  mrg 				  loop->latch, gimple_bb (stmt)))
1.1  mrg 	base = fold_convert (unsigned_type, low);
1.1  mrg       delta = fold_build2 (MINUS_EXPR, unsigned_type, extreme, base);
1.1  mrg     }
1.1  mrg
1.1  mrg   /* STMT is executed at most NITER_BOUND + 1 times, since otherwise the value
1.1  mrg      would get out of the range.  The estimate is recorded as a non-exit
1.1  mrg      bound (IS_EXIT is false in the call below).  */
1.1  mrg   niter_bound = fold_build2 (FLOOR_DIV_EXPR, unsigned_type, delta, step);
1.1  mrg   widest_int max = derive_constant_upper_bound (niter_bound);
1.1  mrg   record_estimate (loop, niter_bound, max, stmt, false, realistic, upper);
1.1  mrg }
1.1  mrg
1.1  mrg /* Determine information about number of iterations a LOOP from the index
1.1  mrg    IDX of a data reference accessed in STMT.  Callback for for_each_index.
1.1  mrg
1.1  mrg    struct ilb_data carries LOOP and STMT to the callback
1.1  mrg    idx_infer_loop_bounds.  BASE is the reference whose index IDX is being
1.1  mrg    visited; anything but an ARRAY_REF is ignored.  The evolution of *IDX is
1.1  mrg    analyzed in the loop containing STMT and instantiated for LOOP.  When it
1.1  mrg    has a nonzero constant step and an initial value that is free of chrecs
1.1  mrg    and of symbols defined in LOOP, and the array has constant bounds that fit
1.1  mrg    the type of the step, the fact that the index has to stay within
1.1  mrg    <LOW, HIGH> is handed to record_nonwrapping_iv.  The callback returns true
1.1  mrg    on every path.  */
1.1  mrg
1.1  mrg struct ilb_data
1.1  mrg {
1.1  mrg   class loop *loop;
1.1  mrg   gimple *stmt;
1.1  mrg };
1.1  mrg
1.1  mrg static bool
1.1  mrg idx_infer_loop_bounds (tree base, tree *idx, void *dta)
1.1  mrg {
1.1  mrg   struct ilb_data *data = (struct ilb_data *) dta;
1.1  mrg   tree ev, init, step;
1.1  mrg   tree low, high, type, next;
1.1  mrg   bool sign, upper = true, at_end = false;
1.1  mrg   class loop *loop = data->loop;
1.1  mrg
1.1  mrg   if (TREE_CODE (base) != ARRAY_REF)
1.1  mrg     return true;
1.1  mrg
1.1  mrg   /* For arrays at the end of the structure, we are not guaranteed that they
1.1  mrg      do not really extend over their declared size.  However, for arrays of
1.1  mrg      size greater than one, this is unlikely to be intended.  Hence such an
1.1  mrg      array still yields an estimate, but not a guaranteed upper bound.  */
1.1  mrg   if (array_at_struct_end_p (base))
1.1  mrg     {
1.1  mrg       at_end = true;
1.1  mrg       upper = false;
1.1  mrg     }
1.1  mrg
1.1  mrg   class loop *dloop = loop_containing_stmt (data->stmt);
1.1  mrg   if (!dloop)
1.1  mrg     return true;
1.1  mrg
1.1  mrg   ev = analyze_scalar_evolution (dloop, *idx);
1.1  mrg   ev = instantiate_parameters (loop, ev);
1.1  mrg   init = initial_condition (ev);
1.1  mrg   step = evolution_part_in_loop_num (ev, loop->num);
1.1  mrg
1.1  mrg   if (!init
1.1  mrg       || !step
1.1  mrg       || TREE_CODE (step) != INTEGER_CST
1.1  mrg       || integer_zerop (step)
1.1  mrg       || tree_contains_chrecs (init, NULL)
1.1  mrg       || chrec_contains_symbols_defined_in_loop (init, loop->num))
1.1  mrg     return true;
1.1  mrg
1.1  mrg   low = array_ref_low_bound (base);
1.1  mrg   high = array_ref_up_bound (base);
1.1  mrg
1.1  mrg   /* The case of nonconstant bounds could be handled, but it would be
1.1  mrg      complicated.  */
1.1  mrg   if (TREE_CODE (low) != INTEGER_CST
1.1  mrg       || !high
1.1  mrg       || TREE_CODE (high) != INTEGER_CST)
1.1  mrg     return true;
1.1  mrg   sign = tree_int_cst_sign_bit (step);
1.1  mrg   type = TREE_TYPE (step);
1.1  mrg
1.1  mrg   /* The array of length 1 at the end of a structure most likely extends
1.1  mrg      beyond its bounds.  */
1.1  mrg   if (at_end
1.1  mrg       && operand_equal_p (low, high, 0))
1.1  mrg     return true;
1.1  mrg
1.1  mrg   /* In case the relevant bound of the array does not fit in type, or
1.1  mrg      it does, but bound + step (in type) still belongs into the range of the
1.1  mrg      array, the index may wrap and still stay within the range of the array
1.1  mrg      (consider e.g. if the array is indexed by the full range of
1.1  mrg      unsigned char).
1.1  mrg
1.1  mrg      To make things simpler, we require both bounds to fit into type, although
1.1  mrg      there are cases where this would not be strictly necessary.  */
1.1  mrg   if (!int_fits_type_p (high, type)
1.1  mrg       || !int_fits_type_p (low, type))
1.1  mrg     return true;
1.1  mrg   low = fold_convert (type, low);
1.1  mrg   high = fold_convert (type, high);
1.1  mrg
1.1  mrg   if (sign)
1.1  mrg     next = fold_binary (PLUS_EXPR, type, low, step);
1.1  mrg   else
1.1  mrg     next = fold_binary (PLUS_EXPR, type, high, step);
1.1  mrg
1.1  mrg   if (tree_int_cst_compare (low, next) <= 0
1.1  mrg       && tree_int_cst_compare (next, high) <= 0)
1.1  mrg     return true;
1.1  mrg
1.1  mrg   /* If access is not executed on every iteration, we must ensure that
1.1  mrg      overflow may not make the access valid later.  */
1.1  mrg   if (!dominated_by_p (CDI_DOMINATORS, loop->latch, gimple_bb (data->stmt))
1.1  mrg       && scev_probably_wraps_p (NULL_TREE,
1.1  mrg 				initial_condition_in_loop_num (ev, loop->num),
1.1  mrg 				step, data->stmt, loop, true))
1.1  mrg     upper = false;
1.1  mrg
1.1  mrg   record_nonwrapping_iv (loop, init, step, data->stmt, low, high, false, upper);
1.1  mrg   return true;
1.1  mrg }
1.1  mrg
1.1  mrg /* Derive bounds on the number of iterations of LOOP from the bounds of
1.1  mrg    the arrays indexed in the data reference REF, which is accessed in STMT.
1.1  mrg    Every index of REF is passed to idx_infer_loop_bounds.  */
1.1  mrg
1.1  mrg static void
1.1  mrg infer_loop_bounds_from_ref (class loop *loop, gimple *stmt, tree ref)
1.1  mrg {
1.1  mrg   /* Context handed through for_each_index to the callback.  */
1.1  mrg   struct ilb_data walk_ctx = { loop, stmt };
1.1  mrg
1.1  mrg   for_each_index (&ref, idx_infer_loop_bounds, &walk_ctx);
1.1  mrg }
1.1  mrg
1.1  mrg /* Derive bounds on the number of iterations of LOOP from the way arrays
1.1  mrg    are used in STMT.  For an assignment the left-hand side and the first
1.1  mrg    right-hand side operand are examined, for a call its left-hand side (if
1.1  mrg    any) and each argument.  Other statements are ignored.  */
1.1  mrg
1.1  mrg static void
1.1  mrg infer_loop_bounds_from_array (class loop *loop, gimple *stmt)
1.1  mrg {
1.1  mrg   if (is_gimple_assign (stmt))
1.1  mrg     {
1.1  mrg       tree dest = gimple_assign_lhs (stmt);
1.1  mrg       tree src = gimple_assign_rhs1 (stmt);
1.1  mrg
1.1  mrg       /* Each memory access contributes a bound on the iteration domain
1.1  mrg 	 through its access function.  */
1.1  mrg       if (REFERENCE_CLASS_P (dest))
1.1  mrg 	infer_loop_bounds_from_ref (loop, stmt, dest);
1.1  mrg
1.1  mrg       if (REFERENCE_CLASS_P (src))
1.1  mrg 	infer_loop_bounds_from_ref (loop, stmt, src);
1.1  mrg
1.1  mrg       return;
1.1  mrg     }
1.1  mrg
1.1  mrg   if (!is_gimple_call (stmt))
1.1  mrg     return;
1.1  mrg
1.1  mrg   const unsigned nargs = gimple_call_num_args (stmt);
1.1  mrg
1.1  mrg   /* The value returned by the call may be stored through a reference.  */
1.1  mrg   tree call_lhs = gimple_call_lhs (stmt);
1.1  mrg   if (call_lhs && REFERENCE_CLASS_P (call_lhs))
1.1  mrg     infer_loop_bounds_from_ref (loop, stmt, call_lhs);
1.1  mrg
1.1  mrg   /* And so may any of the arguments be read through one.  */
1.1  mrg   for (unsigned ix = 0; ix < nargs; ix++)
1.1  mrg     {
1.1  mrg       tree call_arg = gimple_call_arg (stmt, ix);
1.1  mrg       if (REFERENCE_CLASS_P (call_arg))
1.1  mrg 	infer_loop_bounds_from_ref (loop, stmt, call_arg);
1.1  mrg     }
1.1  mrg }
1.1  mrg
1.1  mrg /* Derive a bound on the number of iterations of LOOP from the assumption
1.1  mrg    that the pointer arithmetic in STMT does not overflow.  Only
1.1  mrg    POINTER_PLUS_EXPR assignments to an SSA_NAME of a non-wrapping type are
1.1  mrg    considered, and only when the pointer operand is invariant in LOOP and
1.1  mrg    the offset operand has the precision of the pointer.  */
1.1  mrg
1.1  mrg static void
1.1  mrg infer_loop_bounds_from_pointer_arith (class loop *loop, gimple *stmt)
1.1  mrg {
1.1  mrg   /* Only pointer additions are of interest.  */
1.1  mrg   if (!is_gimple_assign (stmt))
1.1  mrg     return;
1.1  mrg   if (gimple_assign_rhs_code (stmt) != POINTER_PLUS_EXPR)
1.1  mrg     return;
1.1  mrg
1.1  mrg   tree result = gimple_assign_lhs (stmt);
1.1  mrg   if (TREE_CODE (result) != SSA_NAME)
1.1  mrg     return;
1.1  mrg
1.1  mrg   tree type = TREE_TYPE (result);
1.1  mrg   if (!nowrap_type_p (type))
1.1  mrg     return;
1.1  mrg
1.1  mrg   /* The pointer operand has to be invariant in LOOP.  */
1.1  mrg   tree ptr_op = gimple_assign_rhs1 (stmt);
1.1  mrg   if (!expr_invariant_in_loop_p (loop, ptr_op))
1.1  mrg     return;
1.1  mrg
1.1  mrg   /* The offset operand has to be as wide as the pointer.  */
1.1  mrg   tree offset_op = gimple_assign_rhs2 (stmt);
1.1  mrg   if (TYPE_PRECISION (type) != TYPE_PRECISION (TREE_TYPE (offset_op)))
1.1  mrg     return;
1.1  mrg
1.1  mrg   /* Analyze the result in the loop that contains STMT and instantiate the
1.1  mrg      evolution with respect to LOOP.  */
1.1  mrg   class loop *stmt_loop = loop_containing_stmt (stmt);
1.1  mrg   tree evolution = analyze_scalar_evolution (stmt_loop, result);
1.1  mrg   evolution = instantiate_parameters (loop, evolution);
1.1  mrg   if (chrec_contains_undetermined (evolution))
1.1  mrg     return;
1.1  mrg
1.1  mrg   tree iv_base = initial_condition_in_loop_num (evolution, loop->num);
1.1  mrg   tree iv_step = evolution_part_in_loop_num (evolution, loop->num);
1.1  mrg
1.1  mrg   /* A usable evolution has a constant step and a base that neither
1.1  mrg      contains chrecs nor depends on symbols defined in LOOP.  */
1.1  mrg   if (!iv_base || !iv_step)
1.1  mrg     return;
1.1  mrg   if (TREE_CODE (iv_step) != INTEGER_CST
1.1  mrg       || tree_contains_chrecs (iv_base, NULL)
1.1  mrg       || chrec_contains_symbols_defined_in_loop (iv_base, loop->num))
1.1  mrg     return;
1.1  mrg
1.1  mrg   tree range_low = lower_bound_in_type (type, type);
1.1  mrg   tree range_high = upper_bound_in_type (type, type);
1.1  mrg
1.1  mrg   /* In C, pointer arithmetic p + 1 cannot use a NULL pointer, and p - 1
1.1  mrg      cannot produce a NULL pointer.  The contrary would mean NULL points to
1.1  mrg      an object, while NULL is supposed to compare unequal with the address
1.1  mrg      of all objects.  Furthermore, p + 1 cannot produce a NULL pointer and
1.1  mrg      p - 1 cannot use a NULL pointer since that would mean wrapping, which
1.1  mrg      we assume here not to happen.  So NULL is excluded from the valid range
1.1  mrg      of pointer arithmetic: a zero lower end is raised to the alignment, in
1.1  mrg      bytes, of the pointed-to type.  */
1.1  mrg   if (flag_delete_null_pointer_checks && int_cst_value (range_low) == 0)
1.1  mrg     range_low = build_int_cstu (TREE_TYPE (range_low),
1.1  mrg 				TYPE_ALIGN_UNIT (TREE_TYPE (type)));
1.1  mrg
1.1  mrg   record_nonwrapping_iv (loop, iv_base, iv_step, stmt, range_low, range_high,
1.1  mrg 			 false, true);
1.1  mrg }
1.1  mrg
1.1  mrg /* Derive a bound on the number of iterations of LOOP from the assumption
1.1  mrg    that the signed arithmetic in STMT does not overflow.  STMT has to be an
1.1  mrg    assignment to an SSA_NAME of an integral type with undefined overflow
1.1  mrg    whose evolution in LOOP has a constant step.  */
1.1  mrg
1.1  mrg static void
1.1  mrg infer_loop_bounds_from_signedness (class loop *loop, gimple *stmt)
1.1  mrg {
1.1  mrg   if (gimple_code (stmt) != GIMPLE_ASSIGN)
1.1  mrg     return;
1.1  mrg
1.1  mrg   tree result = gimple_assign_lhs (stmt);
1.1  mrg   if (TREE_CODE (result) != SSA_NAME)
1.1  mrg     return;
1.1  mrg
1.1  mrg   /* Only integral types in which overflow is undefined tell us anything.  */
1.1  mrg   tree type = TREE_TYPE (result);
1.1  mrg   if (!INTEGRAL_TYPE_P (type))
1.1  mrg     return;
1.1  mrg   if (!TYPE_OVERFLOW_UNDEFINED (type))
1.1  mrg     return;
1.1  mrg
1.1  mrg   tree evolution = analyze_scalar_evolution (loop, result);
1.1  mrg   evolution = instantiate_parameters (loop, evolution);
1.1  mrg   if (chrec_contains_undetermined (evolution))
1.1  mrg     return;
1.1  mrg
1.1  mrg   tree iv_base = initial_condition_in_loop_num (evolution, loop->num);
1.1  mrg   tree iv_step = evolution_part_in_loop_num (evolution, loop->num);
1.1  mrg
1.1  mrg   /* A usable evolution has a constant step and a base that neither
1.1  mrg      contains chrecs nor depends on symbols defined in LOOP.  */
1.1  mrg   if (!iv_base || !iv_step)
1.1  mrg     return;
1.1  mrg   if (TREE_CODE (iv_step) != INTEGER_CST
1.1  mrg       || tree_contains_chrecs (iv_base, NULL)
1.1  mrg       || chrec_contains_symbols_defined_in_loop (iv_base, loop->num))
1.1  mrg     return;
1.1  mrg
1.1  mrg   /* Start from the full range of the type and narrow it to the range the
1.1  mrg      range query reports for the result, if that is a VR_RANGE.  */
1.1  mrg   tree range_low = lower_bound_in_type (type, type);
1.1  mrg   tree range_high = upper_bound_in_type (type, type);
1.1  mrg   value_range result_range;
1.1  mrg   get_range_query (cfun)->range_of_expr (result_range, result);
1.1  mrg   if (result_range.kind () == VR_RANGE)
1.1  mrg     {
1.1  mrg       range_low = wide_int_to_tree (type, result_range.lower_bound ());
1.1  mrg       range_high = wide_int_to_tree (type, result_range.upper_bound ());
1.1  mrg     }
1.1  mrg
1.1  mrg   record_nonwrapping_iv (loop, iv_base, iv_step, stmt, range_low, range_high,
1.1  mrg 			 false, true);
1.1  mrg }
1.1  mrg
1.1  mrg /* Walk the NUM_NODES basic blocks BBS of LOOP and derive bounds on its
1.1  mrg    number of iterations from operations whose misuse would be undefined
1.1  mrg    behavior:
1.1  mrg
1.1  mrg    - data references should not access elements over the statically
1.1  mrg      allocated size,
1.1  mrg
1.1  mrg    - signed variables should not overflow when flag_wrapv is not set,
1.1  mrg
1.1  mrg    - pointer arithmetic should not overflow.
1.1  mrg */
1.1  mrg
1.1  mrg static void
1.1  mrg infer_loop_bounds_from_undefined (class loop *loop, basic_block *bbs)
1.1  mrg {
1.1  mrg   for (unsigned i = 0; i < loop->num_nodes; i++)
1.1  mrg     {
1.1  mrg       basic_block bb = bbs[i];
1.1  mrg
1.1  mrg       /* Operations in a block that is not executed in each iteration of
1.1  mrg 	 the loop cannot give a reliable upper bound on the # of iterations,
1.1  mrg 	 only a guess.  For such blocks just the array analysis is run; the
1.1  mrg 	 other two analyses are limited to blocks dominating the latch.  */
1.1  mrg       const bool reliable = dominated_by_p (CDI_DOMINATORS, loop->latch, bb);
1.1  mrg
1.1  mrg       for (gimple_stmt_iterator gsi = gsi_start_bb (bb);
1.1  mrg 	   !gsi_end_p (gsi);
1.1  mrg 	   gsi_next (&gsi))
1.1  mrg 	{
1.1  mrg 	  gimple *stmt = gsi_stmt (gsi);
1.1  mrg
1.1  mrg 	  infer_loop_bounds_from_array (loop, stmt);
1.1  mrg
1.1  mrg 	  if (!reliable)
1.1  mrg 	    continue;
1.1  mrg
1.1  mrg 	  infer_loop_bounds_from_signedness (loop, stmt);
1.1  mrg 	  infer_loop_bounds_from_pointer_arith (loop, stmt);
1.1  mrg 	}
1.1  mrg     }
1.1  mrg }
1.1  mrg
1.1  mrg /* qsort callback: order the widest_ints that P1 and P2 point to by
1.1  mrg    unsigned comparison.  */
1.1  mrg
1.1  mrg static int
1.1  mrg wide_int_cmp (const void *p1, const void *p2)
1.1  mrg {
1.1  mrg   const widest_int &lhs = *static_cast<const widest_int *> (p1);
1.1  mrg   const widest_int &rhs = *static_cast<const widest_int *> (p2);
1.1  mrg
1.1  mrg   return wi::cmpu (lhs, rhs);
1.1  mrg }
1.1  mrg
1.1  mrg /* Binary-search BOUNDS, which is sorted in increasing (unsigned) order,
1.1  mrg    for BOUND and return the index of an element equal to it.  BOUND has to
1.1  mrg    be present; not finding it is treated as unreachable.  */
1.1  mrg
1.1  mrg static int
1.1  mrg bound_index (const vec<widest_int> &bounds, const widest_int &bound)
1.1  mrg {
1.1  mrg   unsigned int lo = 0;
1.1  mrg   unsigned int hi = bounds.length ();
1.1  mrg
1.1  mrg   /* Invariant: if BOUND is present, it is at an index in [LO, HI).  */
1.1  mrg   while (lo != hi)
1.1  mrg     {
1.1  mrg       const unsigned int mid = (lo + hi) / 2;
1.1  mrg       const widest_int &candidate = bounds[mid];
1.1  mrg
1.1  mrg       if (candidate == bound)
1.1  mrg 	return mid;
1.1  mrg
1.1  mrg       if (wi::ltu_p (candidate, bound))
1.1  mrg 	lo = mid + 1;
1.1  mrg       else
1.1  mrg 	hi = mid;
1.1  mrg     }
1.1  mrg   gcc_unreachable ();
1.1  mrg }
1.1  mrg
1.1  mrg /* We recorded loop bounds only for statements dominating loop latch (and thus
1.1  mrg    executed each loop iteration).  If there are any bounds on statements not
1.1  mrg    dominating the loop latch we can improve the estimate by walking the loop
1.1  mrg    body and seeing if every path from loop header to loop latch contains
1.1  mrg    some bounded statement.
1.1  mrg
1.1  mrg    The entries of LOOP->bounds that are lower than the recorded upper bound
1.1  mrg    of LOOP (or all of them when no upper bound is recorded) are collected,
1.1  mrg    sorted, and attached to the basic blocks of their statements.  A walk
1.1  mrg    starting in LOOP->header then determines which of them still holds on
1.1  mrg    every path to the latch; if one does, it is passed to record_niter_bound
1.1  mrg    as an upper bound that is not marked realistic.  */
1.1  mrg
1.1  mrg static void
1.1  mrg discover_iteration_bound_by_body_walk (class loop *loop)
1.1  mrg {
1.1  mrg   class nb_iter_bound *elt;
1.1  mrg   auto_vec<widest_int> bounds;
1.1  mrg   vec<vec<basic_block> > queues = vNULL;
1.1  mrg   vec<basic_block> queue = vNULL;
1.1  mrg   ptrdiff_t queue_index;
1.1  mrg   ptrdiff_t latch_index = 0;
1.1  mrg
1.1  mrg   /* Discover what bounds may interest us.  */
1.1  mrg   for (elt = loop->bounds; elt; elt = elt->next)
1.1  mrg     {
1.1  mrg       widest_int bound = elt->bound;
1.1  mrg
1.1  mrg       /* Exit terminates loop at given iteration, while non-exits produce undefined
1.1  mrg 	 effect on the next iteration.  */
1.1  mrg       if (!elt->is_exit)
1.1  mrg 	{
1.1  mrg 	  bound += 1;
1.1  mrg 	  /* If an overflow occurred, ignore the result.  */
1.1  mrg 	  if (bound == 0)
1.1  mrg 	    continue;
1.1  mrg 	}
1.1  mrg
1.1  mrg       if (!loop->any_upper_bound
1.1  mrg 	  || wi::ltu_p (bound, loop->nb_iterations_upper_bound))
1.1  mrg         bounds.safe_push (bound);
1.1  mrg     }
1.1  mrg
1.1  mrg   /* Exit early if there is nothing to do.  */
1.1  mrg   if (!bounds.exists ())
1.1  mrg     return;
1.1  mrg
1.1  mrg   if (dump_file && (dump_flags & TDF_DETAILS))
1.1  mrg     fprintf (dump_file, " Trying to walk loop body to reduce the bound.\n");
1.1  mrg
1.1  mrg   /* Sort the bounds in increasing order (wide_int_cmp compares them as
1.1  mrg      unsigned values); bound_index relies on that order.  */
1.1  mrg   bounds.qsort (wide_int_cmp);
1.1  mrg
1.1  mrg   /* For every basic block record the lowest bound that is guaranteed to
1.1  mrg      terminate the loop, as an index into BOUNDS.  The bounds are filtered
1.1  mrg      exactly as in the loop above, so each one is found by bound_index.  */
1.1  mrg
1.1  mrg   hash_map<basic_block, ptrdiff_t> bb_bounds;
1.1  mrg   for (elt = loop->bounds; elt; elt = elt->next)
1.1  mrg     {
1.1  mrg       widest_int bound = elt->bound;
1.1  mrg       if (!elt->is_exit)
1.1  mrg 	{
1.1  mrg 	  bound += 1;
1.1  mrg 	  /* If an overflow occurred, ignore the result.  */
1.1  mrg 	  if (bound == 0)
1.1  mrg 	    continue;
1.1  mrg 	}
1.1  mrg
1.1  mrg       if (!loop->any_upper_bound
1.1  mrg 	  || wi::ltu_p (bound, loop->nb_iterations_upper_bound))
1.1  mrg 	{
1.1  mrg 	  ptrdiff_t index = bound_index (bounds, bound);
1.1  mrg 	  ptrdiff_t *entry = bb_bounds.get (gimple_bb (elt->stmt));
1.1  mrg 	  if (!entry)
1.1  mrg 	    bb_bounds.put (gimple_bb (elt->stmt), index);
1.1  mrg 	  else if ((ptrdiff_t)*entry > index)
1.1  mrg 	    *entry = index;
1.1  mrg 	}
1.1  mrg     }
1.1  mrg
1.1  mrg   hash_map<basic_block, ptrdiff_t> block_priority;
1.1  mrg
1.1  mrg   /* Perform shortest path discovery loop->header ... loop->latch.
1.1  mrg
1.1  mrg      The "distance" is given by the smallest loop bound of basic block
1.1  mrg      present in the path and we look for path with largest smallest bound
1.1  mrg      on it.
1.1  mrg
1.1  mrg      To avoid the need for a Fibonacci heap on widest_ints we simply
1.1  mrg      compress the bounds into indexes to BOUNDS array and then represent the
1.1  mrg      queue as arrays of queues for every index.
1.1  mrg      Index of BOUNDS.length() means that the execution of given BB has
1.1  mrg      no bounds determined.
1.1  mrg
1.1  mrg      BLOCK_PRIORITY is a hash map translating basic block into the index
1.1  mrg      it was last inserted into the priority queue with; a block is only
1.1  mrg      re-inserted with a greater index than the one stored for it.
1.1  mrg
1.1  mrg      The queues are visited from the greatest index down.  A queue whose
1.1  mrg      index does not exceed the best index already seen on the latch edge
1.1  mrg      (LATCH_INDEX) is released without being processed.  */
1.1  mrg   latch_index = -1;
1.1  mrg
1.1  mrg   /* Start walk in loop header with index set to infinite bound.  */
1.1  mrg   queue_index = bounds.length ();
1.1  mrg   queues.safe_grow_cleared (queue_index + 1, true);
1.1  mrg   queue.safe_push (loop->header);
1.1  mrg   queues[queue_index] = queue;
1.1  mrg   block_priority.put (loop->header, queue_index);
1.1  mrg
1.1  mrg   for (; queue_index >= 0; queue_index--)
1.1  mrg     {
1.1  mrg       if (latch_index < queue_index)
1.1  mrg 	{
1.1  mrg 	  while (queues[queue_index].length ())
1.1  mrg 	    {
1.1  mrg 	      basic_block bb;
1.1  mrg 	      ptrdiff_t bound_index = queue_index;
1.1  mrg               edge e;
1.1  mrg               edge_iterator ei;
1.1  mrg
1.1  mrg 	      queue = queues[queue_index];
1.1  mrg 	      bb = queue.pop ();
1.1  mrg
1.1  mrg 	      /* The BB was re-inserted with a greater index after this queue
1.1  mrg 		 entry was made, so this entry is stale; skip it.  */
1.1  mrg 	      if (*block_priority.get (bb) > queue_index)
1.1  mrg 		continue;
1.1  mrg
1.1  mrg 	      /* See if we can improve the bound.  */
1.1  mrg 	      ptrdiff_t *entry = bb_bounds.get (bb);
1.1  mrg 	      if (entry && *entry < bound_index)
1.1  mrg 		bound_index = *entry;
1.1  mrg
1.1  mrg 	      /* Insert successors into the queue, watch for latch edge
1.1  mrg 		 and record greatest index we saw.  Exit edges of the loop
1.1  mrg 		 are not followed.  */
1.1  mrg 	      FOR_EACH_EDGE (e, ei, bb->succs)
1.1  mrg 		{
1.1  mrg 		  bool insert = false;
1.1  mrg
1.1  mrg 		  if (loop_exit_edge_p (loop, e))
1.1  mrg 		    continue;
1.1  mrg
1.1  mrg 		  if (e == loop_latch_edge (loop)
1.1  mrg 		      && latch_index < bound_index)
1.1  mrg 		    latch_index = bound_index;
1.1  mrg 		  else if (!(entry = block_priority.get (e->dest)))
1.1  mrg 		    {
1.1  mrg 		      insert = true;
1.1  mrg 		      block_priority.put (e->dest, bound_index);
1.1  mrg 		    }
1.1  mrg 		  else if (*entry < bound_index)
1.1  mrg 		    {
1.1  mrg 		      insert = true;
1.1  mrg 		      *entry = bound_index;
1.1  mrg 		    }
1.1  mrg
1.1  mrg 		  if (insert)
1.1  mrg 		    queues[bound_index].safe_push (e->dest);
1.1  mrg 		}
1.1  mrg 	    }
1.1  mrg 	}
1.1  mrg       queues[queue_index].release ();
1.1  mrg     }
1.1  mrg
1.1  mrg   gcc_assert (latch_index >= 0);
1.1  mrg   if ((unsigned)latch_index < bounds.length ())
1.1  mrg     {
1.1  mrg       if (dump_file && (dump_flags & TDF_DETAILS))
1.1  mrg 	{
1.1  mrg 	  fprintf (dump_file, "Found better loop bound ");
1.1  mrg 	  print_decu (bounds[latch_index], dump_file);
1.1  mrg 	  fprintf (dump_file, "\n");
1.1  mrg 	}
1.1  mrg       record_niter_bound (loop, bounds[latch_index], false, true);
1.1  mrg     }
1.1  mrg
1.1  mrg   queues.release ();
1.1  mrg }
1.1  mrg
1.1  mrg /* Check whether every path through the body of LOOP runs into a statement
1.1  mrg    that is known not to be executed in the last iteration before it can
1.1  mrg    reach the latch, a loop exit, or a statement with side effects.  If so,
1.1  mrg    record an upper bound that is one lower than the current one.  */
1.1  mrg
1.1  mrg static void
1.1  mrg maybe_lower_iteration_bound (class loop *loop)
1.1  mrg {
1.1  mrg   hash_set<gimple *> *bounding_stmts = NULL;
1.1  mrg
1.1  mrg   /* Gather the non-exit statements whose recorded bound is lower than
1.1  mrg      nb_iterations_upper_bound.  The set is allocated lazily, so it stays
1.1  mrg      NULL when there is nothing interesting.
1.1  mrg
1.1  mrg      TODO: Due to the way record_estimate chooses estimates to store, the
1.1  mrg      bounds will always be nb_iterations_upper_bound-1.  We can change this
1.1  mrg      to also record statements not dominating the loop latch and update the
1.1  mrg      walk below to the shortest path algorithm.  */
1.1  mrg   for (class nb_iter_bound *b = loop->bounds; b; b = b->next)
1.1  mrg     {
1.1  mrg       if (b->is_exit
1.1  mrg           || !wi::ltu_p (b->bound, loop->nb_iterations_upper_bound))
1.1  mrg         continue;
1.1  mrg
1.1  mrg       if (!bounding_stmts)
1.1  mrg         bounding_stmts = new hash_set<gimple *>;
1.1  mrg       bounding_stmts->add (b->stmt);
1.1  mrg     }
1.1  mrg   if (!bounding_stmts)
1.1  mrg     return;
1.1  mrg
1.1  mrg   /* Walk the body starting at the loop header, using a worklist of
1.1  mrg      blocks.  ESCAPED becomes true as soon as the latch edge, an exit
1.1  mrg      edge, or a statement with side effects (which may terminate the loop
1.1  mrg      otherwise) is reachable without first passing one of the bounding
1.1  mrg      statements.  */
1.1  mrg   auto_vec<basic_block> worklist;
1.1  mrg   bitmap seen = BITMAP_ALLOC (NULL);
1.1  mrg   bool escaped = false;
1.1  mrg
1.1  mrg   worklist.safe_push (loop->header);
1.1  mrg   bitmap_set_bit (seen, loop->header->index);
1.1  mrg
1.1  mrg   while (!escaped && !worklist.is_empty ())
1.1  mrg     {
1.1  mrg       basic_block bb = worklist.pop ();
1.1  mrg       bool bounded = false;
1.1  mrg
1.1  mrg       /* Scan the block; whichever comes first, a bounding statement or
1.1  mrg          a statement with side effects, decides its fate.  */
1.1  mrg       for (gimple_stmt_iterator gsi = gsi_start_bb (bb);
1.1  mrg            !gsi_end_p (gsi); gsi_next (&gsi))
1.1  mrg         {
1.1  mrg           gimple *stmt = gsi_stmt (gsi);
1.1  mrg           if (bounding_stmts->contains (stmt))
1.1  mrg             {
1.1  mrg               bounded = true;
1.1  mrg               break;
1.1  mrg             }
1.1  mrg           if (gimple_has_side_effects (stmt))
1.1  mrg             {
1.1  mrg               escaped = true;
1.1  mrg               break;
1.1  mrg             }
1.1  mrg         }
1.1  mrg       if (escaped)
1.1  mrg         break;
1.1  mrg
1.1  mrg       /* Paths through a block with a bounding statement need not be
1.1  mrg          followed any further.  */
1.1  mrg       if (bounded)
1.1  mrg         continue;
1.1  mrg
1.1  mrg       edge e;
1.1  mrg       edge_iterator ei;
1.1  mrg       FOR_EACH_EDGE (e, ei, bb->succs)
1.1  mrg         {
1.1  mrg           if (loop_exit_edge_p (loop, e)
1.1  mrg               || e == loop_latch_edge (loop))
1.1  mrg             {
1.1  mrg               escaped = true;
1.1  mrg               break;
1.1  mrg             }
1.1  mrg           /* bitmap_set_bit returns true only for a newly set bit, so
1.1  mrg              each block is queued at most once.  */
1.1  mrg           if (bitmap_set_bit (seen, e->dest->index))
1.1  mrg             worklist.safe_push (e->dest);
1.1  mrg         }
1.1  mrg     }
1.1  mrg
1.1  mrg   /* If every path through the loop reaches a bounding statement first,
1.1  mrg      the last iteration of the loop would have undefined effect and the
1.1  mrg      number of iterations can be decreased.  */
1.1  mrg   if (!escaped)
1.1  mrg     {
1.1  mrg       if (dump_file && (dump_flags & TDF_DETAILS))
1.1  mrg         fprintf (dump_file, "Reducing loop iteration estimate by 1; "
1.1  mrg                  "undefined statement must be executed at the last iteration.\n");
1.1  mrg       record_niter_bound (loop, loop->nb_iterations_upper_bound - 1,
1.1  mrg                           false, true);
1.1  mrg     }
1.1  mrg
1.1  mrg   BITMAP_FREE (seen);
1.1  mrg   delete bounding_stmts;
1.1  mrg }
1.1  mrg
1.1  mrg /* Derive an expected upper bound on the number of loop iterations from a
1.1  mrg    BUILT_IN_EXPECT_WITH_PROBABILITY call that defines the left-hand side
1.1  mrg    of the condition COND.
1.1  mrg
1.1  mrg    Returns NULL_TREE when COND is NULL, when its left-hand side is not an
1.1  mrg    SSA name defined by a three-argument call to that builtin, or when the
1.1  mrg    comparison or the division below does not fold to a constant.
1.1  mrg    Otherwise returns an integer constant in the type of the left-hand
1.1  mrg    side holding 1 / P, where P is the probability argument of the call,
1.1  mrg    or 1 - P if the comparison of the expected value against the
1.1  mrg    right-hand side of COND folds to zero.  */
1.1  mrg
1.1  mrg static tree
1.1  mrg get_upper_bound_based_on_builtin_expr_with_prob (gcond *cond)
1.1  mrg {
1.1  mrg   if (!cond)
1.1  mrg     return NULL_TREE;
1.1  mrg
1.1  mrg   tree lhs = gimple_cond_lhs (cond);
1.1  mrg   if (TREE_CODE (lhs) != SSA_NAME)
1.1  mrg     return NULL_TREE;
1.1  mrg
1.1  mrg   gimple *def_stmt = SSA_NAME_DEF_STMT (lhs);
1.1  mrg   gcall *call = dyn_cast<gcall *> (def_stmt);
1.1  mrg   if (!call)
1.1  mrg     return NULL_TREE;
1.1  mrg
1.1  mrg   tree fndecl = gimple_call_fndecl (call);
1.1  mrg   if (!fndecl)
1.1  mrg     return NULL_TREE;
1.1  mrg   if (!fndecl_built_in_p (fndecl, BUILT_IN_EXPECT_WITH_PROBABILITY))
1.1  mrg     return NULL_TREE;
1.1  mrg   if (gimple_call_num_args (def_stmt) != 3)
1.1  mrg     return NULL_TREE;
1.1  mrg
1.1  mrg   /* Evaluate the condition with the expected value (argument 1 of the
1.1  mrg      call) substituted for the left-hand side.  */
1.1  mrg   tree expected = gimple_call_arg (call, 1);
1.1  mrg   tree cond_type = TREE_TYPE (lhs);
1.1  mrg   tree outcome = fold_build2 (gimple_cond_code (cond), cond_type,
1.1  mrg                               expected, gimple_cond_rhs (cond));
1.1  mrg   if (TREE_CODE (outcome) != INTEGER_CST)
1.1  mrg     return NULL_TREE;
1.1  mrg
1.1  mrg   /* Argument 2 is the probability.  Use its complement when the
1.1  mrg      condition evaluates to zero for the expected value.  */
1.1  mrg   tree prob = gimple_call_arg (call, 2);
1.1  mrg   tree prob_type = TREE_TYPE (prob);
1.1  mrg   tree one = build_real_from_int_cst (prob_type, integer_one_node);
1.1  mrg   if (integer_zerop (outcome))
1.1  mrg     prob = fold_build2 (MINUS_EXPR, prob_type, one, prob);
1.1  mrg
1.1  mrg   tree inverse = fold_build2 (RDIV_EXPR, prob_type, one, prob);
1.1  mrg   if (TREE_CODE (inverse) != REAL_CST)
1.1  mrg     return NULL_TREE;
1.1  mrg
1.1  mrg   HOST_WIDE_INT iterations = real_to_integer (TREE_REAL_CST_PTR (inverse));
1.1  mrg   return build_int_cst (cond_type, iterations);
1.1  mrg }
1.1  mrg
1.1  mrg /* Records estimates on numbers of iterations of LOOP.  Does nothing if an
1.1  mrg    estimation has already been attempted for LOOP.  Bounds implied by
1.1  mrg    undefined behavior are inferred only when
1.1  mrg    flag_aggressive_loop_optimizations is set.  */
1.1  mrg
1.1  mrg void
1.1  mrg estimate_numbers_of_iterations (class loop *loop)
1.1  mrg {
1.1  mrg   /* Give up if we already have tried to compute an estimation.  */
1.1  mrg   if (loop->estimate_state != EST_NOT_COMPUTED)
1.1  mrg     return;
1.1  mrg
1.1  mrg   if (dump_file && (dump_flags & TDF_DETAILS))
1.1  mrg     fprintf (dump_file, "Estimating # of iterations of loop %d\n", loop->num);
1.1  mrg
1.1  mrg   /* Mark the loop as processed before doing any work, so the check above
1.1  mrg      triggers for any further call on this loop.  */
1.1  mrg   loop->estimate_state = EST_AVAILABLE;
1.1  mrg
1.1  mrg   /* If we have a measured profile, use it to estimate the number of
1.1  mrg      iterations.  Normally this is recorded by branch_prob right after
1.1  mrg      reading the profile; record it here in case a new loop was found.
1.1  mrg
1.1  mrg      The profile status is checked explicitly so that wrong prediction
1.1  mrg      hitrates are not reported for guessed loop iteration heuristics.
1.1  mrg      Already recorded bounds are not recomputed: we ought to be better at
1.1  mrg      updating iteration bounds than at updating the profile in general,
1.1  mrg      so recomputing them later in the compilation would just introduce
1.1  mrg      random roundoff errors.  */
1.1  mrg   if (!loop->any_estimate && loop->header->count.reliable_p ())
1.1  mrg     {
1.1  mrg       gcov_type profiled = expected_loop_iterations_unbounded (loop);
1.1  mrg       widest_int bound = gcov_type_to_wide_int (profiled);
1.1  mrg       record_niter_bound (loop, bound, true, false);
1.1  mrg     }
1.1  mrg
1.1  mrg   /* Ensure that loop->nb_iterations is computed if possible.  If it turns
1.1  mrg      out to be constant, we avoid undefined behavior implied bounds and
1.1  mrg      instead diagnose those loops with -Waggressive-loop-optimizations.  */
1.1  mrg   number_of_latch_executions (loop);
1.1  mrg
1.1  mrg   basic_block *body = get_loop_body (loop);
1.1  mrg   auto_vec<edge> exits = get_loop_exit_edges (loop, body);
1.1  mrg   edge likely_exit = single_likely_exit (loop, exits);
1.1  mrg
1.1  mrg   class tree_niter_desc desc;
1.1  mrg   unsigned ix;
1.1  mrg   edge ex;
1.1  mrg   FOR_EACH_VEC_ELT (exits, ix, ex)
1.1  mrg     {
1.1  mrg       const bool is_likely = (ex == likely_exit);
1.1  mrg
1.1  mrg       /* For the likely exit, also try the bound suggested by a
1.1  mrg          __builtin_expect_with_probability on its condition.  */
1.1  mrg       if (is_likely)
1.1  mrg         {
1.1  mrg           gimple *last = last_stmt (ex->src);
1.1  mrg           if (last != NULL)
1.1  mrg             {
1.1  mrg               gcond *cond = dyn_cast<gcond *> (last);
1.1  mrg               tree prob_bound
1.1  mrg                 = get_upper_bound_based_on_builtin_expr_with_prob (cond);
1.1  mrg               if (prob_bound != NULL_TREE)
1.1  mrg                 {
1.1  mrg                   widest_int max = derive_constant_upper_bound (prob_bound);
1.1  mrg                   record_estimate (loop, prob_bound, max, cond,
1.1  mrg                                    true, true, false);
1.1  mrg                 }
1.1  mrg             }
1.1  mrg         }
1.1  mrg
1.1  mrg       if (!number_of_iterations_exit (loop, ex, &desc,
1.1  mrg                                       false, false, body))
1.1  mrg         continue;
1.1  mrg
1.1  mrg       /* Unless MAY_BE_ZERO is a constant, guard the iteration count with
1.1  mrg          it: the count is zero when MAY_BE_ZERO holds.  */
1.1  mrg       tree niter = desc.niter;
1.1  mrg       tree type = TREE_TYPE (niter);
1.1  mrg       if (TREE_CODE (desc.may_be_zero) != INTEGER_CST)
1.1  mrg         niter = build3 (COND_EXPR, type, desc.may_be_zero,
1.1  mrg                         build_int_cst (type, 0), niter);
1.1  mrg
1.1  mrg       record_estimate (loop, niter, desc.max, last_stmt (ex->src),
1.1  mrg                        true, is_likely, true);
1.1  mrg       record_control_iv (loop, &desc);
1.1  mrg     }
1.1  mrg
1.1  mrg   if (flag_aggressive_loop_optimizations)
1.1  mrg     infer_loop_bounds_from_undefined (loop, body);
1.1  mrg   free (body);
1.1  mrg
1.1  mrg   discover_iteration_bound_by_body_walk (loop);
1.1  mrg
1.1  mrg   maybe_lower_iteration_bound (loop);
1.1  mrg
1.1  mrg   /* If the exact number of iterations of this loop is a known constant,
1.1  mrg      use it as the upper bound, replacing whatever was recorded above.
1.1  mrg      This tries to not break code with undefined behavior by not keeping
1.1  mrg      a smaller maximum number of iterations.  */
1.1  mrg   if (loop->nb_iterations
1.1  mrg       && TREE_CODE (loop->nb_iterations) == INTEGER_CST)
1.1  mrg     {
1.1  mrg       loop->any_upper_bound = true;
1.1  mrg       loop->nb_iterations_upper_bound = wi::to_widest (loop->nb_iterations);
1.1  mrg     }
1.1  mrg }
1.1  mrg
1.1  mrg /* Sets NIT to the estimated number of executions of the latch of the
1.1  mrg    LOOP.  If we have no reliable estimate, the function returns false,
1.1  mrg    otherwise returns true.  */
1.1  mrg
1.1  mrg bool
1.1  mrg estimated_loop_iterations (class loop *loop, widest_int *nit)
1.1  mrg {
1.1  mrg   /* With SCEV information available the estimate can be brought up to
1.1  mrg      date first; without it, whatever was recorded earlier is used.  */
1.1  mrg   const bool have_scev = scev_initialized_p ();
1.1  mrg   if (have_scev)
1.1  mrg     estimate_numbers_of_iterations (loop);
1.1  mrg
1.1  mrg   bool known = get_estimated_loop_iterations (loop, nit);
1.1  mrg   return known;
1.1  mrg }
1.1  mrg
1.1  mrg /* Like estimated_loop_iterations, but returns the estimate as a
1.1  mrg    HOST_WIDE_INT.  Returns -1 if no estimate for LOOP could be derived,
1.1  mrg    if it does not fit a signed HOST_WIDE_INT, or if the converted value
1.1  mrg    is negative.  */
1.1  mrg
1.1  mrg HOST_WIDE_INT
1.1  mrg estimated_loop_iterations_int (class loop *loop)
1.1  mrg {
1.1  mrg   widest_int estimate;
1.1  mrg
1.1  mrg   if (!estimated_loop_iterations (loop, &estimate)
1.1  mrg       || !wi::fits_shwi_p (estimate))
1.1  mrg     return -1;
1.1  mrg
1.1  mrg   HOST_WIDE_INT value = estimate.to_shwi ();
1.1  mrg   if (value < 0)
1.1  mrg     return -1;
1.1  mrg   return value;
1.1  mrg }
1.1  mrg
1.1  mrg
1.1  mrg /* Sets NIT to an upper bound on the number of executions of the latch of
1.1  mrg    the LOOP.  If we have no reliable estimate, the function returns
1.1  mrg    false, otherwise returns true.  */
1.1  mrg
1.1  mrg bool
1.1  mrg max_loop_iterations (class loop *loop, widest_int *nit)
1.1  mrg {
1.1  mrg   /* With SCEV information available the bound can be brought up to date
1.1  mrg      first; without it, whatever was recorded earlier is used.  */
1.1  mrg   const bool have_scev = scev_initialized_p ();
1.1  mrg   if (have_scev)
1.1  mrg     estimate_numbers_of_iterations (loop);
1.1  mrg
1.1  mrg   bool known = get_max_loop_iterations (loop, nit);
1.1  mrg   return known;
1.1  mrg }
1.1  mrg
1.1  mrg /* Like max_loop_iterations, but returns the bound as a HOST_WIDE_INT.
1.1  mrg    Returns -1 if no bound for LOOP could be derived, if it does not fit
1.1  mrg    a signed HOST_WIDE_INT, or if the converted value is negative.  */
1.1  mrg
1.1  mrg HOST_WIDE_INT
1.1  mrg max_loop_iterations_int (class loop *loop)
1.1  mrg {
1.1  mrg   widest_int limit;
1.1  mrg
1.1  mrg   if (!max_loop_iterations (loop, &limit)
1.1  mrg       || !wi::fits_shwi_p (limit))
1.1  mrg     return -1;
1.1  mrg
1.1  mrg   HOST_WIDE_INT value = limit.to_shwi ();
1.1  mrg   if (value < 0)
1.1  mrg     return -1;
1.1  mrg   return value;
1.1  mrg }
1.1  mrg
1.1  mrg /* Sets NIT to a likely upper bound on the number of executions of the
1.1  mrg    latch of the LOOP.  If we have no reliable estimate, the function
1.1  mrg    returns false, otherwise returns true.  */
1.1  mrg
1.1  mrg bool
1.1  mrg likely_max_loop_iterations (class loop *loop, widest_int *nit)
1.1  mrg {
1.1  mrg   /* With SCEV information available the bound can be brought up to date
1.1  mrg      first; without it, whatever was recorded earlier is used.  */
1.1  mrg   const bool have_scev = scev_initialized_p ();
1.1  mrg   if (have_scev)
1.1  mrg     estimate_numbers_of_iterations (loop);
1.1  mrg
1.1  mrg   bool known = get_likely_max_loop_iterations (loop, nit);
1.1  mrg   return known;
1.1  mrg }
1.1  mrg
1.1  mrg /* Like likely_max_loop_iterations, but returns the bound as a
1.1  mrg    HOST_WIDE_INT.  Returns -1 if no bound for LOOP could be derived, if
1.1  mrg    it does not fit a signed HOST_WIDE_INT, or if the converted value is
1.1  mrg    negative.  */
1.1  mrg
1.1  mrg HOST_WIDE_INT
1.1  mrg likely_max_loop_iterations_int (class loop *loop)
1.1  mrg {
1.1  mrg   widest_int limit;
1.1  mrg
1.1  mrg   if (!likely_max_loop_iterations (loop, &limit)
1.1  mrg       || !wi::fits_shwi_p (limit))
1.1  mrg     return -1;
1.1  mrg
1.1  mrg   HOST_WIDE_INT value = limit.to_shwi ();
1.1  mrg   if (value < 0)
1.1  mrg     return -1;
1.1  mrg   return value;
1.1  mrg }
1.1  mrg
1.1  mrg /* Returns an estimate for the number of executions of statements
1.1  mrg    in the LOOP.  For statements before the loop exit, this exceeds
1.1  mrg    the number of executions of the latch by one.  Returns -1 when no
1.1  mrg    latch estimate is available or when adding one overflows.  */
1.1  mrg
1.1  mrg HOST_WIDE_INT
1.1  mrg estimated_stmt_executions_int (class loop *loop)
1.1  mrg {
1.1  mrg   HOST_WIDE_INT latch_execs = estimated_loop_iterations_int (loop);
1.1  mrg   if (latch_execs == -1)
1.1  mrg     return -1;
1.1  mrg
1.1  mrg   /* Add one in the unsigned type; an overflow then shows up as a
1.1  mrg      negative value after converting back.  */
1.1  mrg   unsigned HOST_WIDE_INT sum = (unsigned HOST_WIDE_INT) latch_execs + 1;
1.1  mrg   HOST_WIDE_INT stmt_execs = (HOST_WIDE_INT) sum;
1.1  mrg
1.1  mrg   if (stmt_execs < 0)
1.1  mrg     return -1;
1.1  mrg   return stmt_execs;
1.1  mrg }
1.1  mrg
1.1  mrg /* Sets NIT to the maximum number of executions of the latch of the
1.1  mrg    LOOP, plus one.  Returns false if max_loop_iterations has no bound for
1.1  mrg    LOOP or if the incremented value is not greater (as unsigned) than
1.1  mrg    the bound itself; otherwise returns true.  */
1.1  mrg
1.1  mrg bool
1.1  mrg max_stmt_executions (class loop *loop, widest_int *nit)
1.1  mrg {
1.1  mrg   if (!max_loop_iterations (loop, nit))
1.1  mrg     return false;
1.1  mrg
1.1  mrg   /* Remember the latch count so that a wrap-around of the increment can
1.1  mrg      be detected.  */
1.1  mrg   widest_int latch_execs = *nit;
1.1  mrg   *nit += 1;
1.1  mrg
1.1  mrg   return wi::gtu_p (*nit, latch_execs);
1.1  mrg }
1.1  mrg
1.1  mrg /* Sets NIT to the likely maximum number of executions of the latch of
1.1  mrg    the LOOP, plus one.  Returns false if likely_max_loop_iterations has
1.1  mrg    no bound for LOOP or if the incremented value is not greater (as
1.1  mrg    unsigned) than the bound itself; otherwise returns true.  */
1.1  mrg
1.1  mrg bool
1.1  mrg likely_max_stmt_executions (class loop *loop, widest_int *nit)
1.1  mrg {
1.1  mrg   if (!likely_max_loop_iterations (loop, nit))
1.1  mrg     return false;
1.1  mrg
1.1  mrg   /* Remember the latch count so that a wrap-around of the increment can
1.1  mrg      be detected.  */
1.1  mrg   widest_int latch_execs = *nit;
1.1  mrg   *nit += 1;
1.1  mrg
1.1  mrg   return wi::gtu_p (*nit, latch_execs);
1.1  mrg }
1.1  mrg
1.1  mrg /* Sets NIT to the estimated number of executions of the latch of the
1.1  mrg    LOOP, plus one.  Returns false if estimated_loop_iterations has no
1.1  mrg    estimate for LOOP or if the incremented value is not greater (as
1.1  mrg    unsigned) than the estimate itself; otherwise returns true.  */
1.1  mrg
1.1  mrg bool
1.1  mrg estimated_stmt_executions (class loop *loop, widest_int *nit)
1.1  mrg {
1.1  mrg   if (!estimated_loop_iterations (loop, nit))
1.1  mrg     return false;
1.1  mrg
1.1  mrg   /* Remember the latch count so that a wrap-around of the increment can
1.1  mrg      be detected.  */
1.1  mrg   widest_int latch_execs = *nit;
1.1  mrg   *nit += 1;
1.1  mrg
1.1  mrg   return wi::gtu_p (*nit, latch_execs);
1.1  mrg }
1.1  mrg
1.1  mrg /* Records estimates on numbers of iterations of all loops of FN.  */
1.1  mrg
1.1  mrg void
1.1  mrg estimate_numbers_of_iterations (function *fn)
1.1  mrg {
1.1  mrg   /* Signed overflow warnings are unwanted while computing the
1.1  mrg      estimates: defer them here and drop them once all loops are done.  */
1.1  mrg   fold_defer_overflow_warnings ();
1.1  mrg
1.1  mrg   for (class loop *current : loops_list (fn, 0))
1.1  mrg     {
1.1  mrg       estimate_numbers_of_iterations (current);
1.1  mrg     }
1.1  mrg
1.1  mrg   fold_undefer_and_ignore_overflow_warnings ();
1.1  mrg }
1.1  mrg
1.1  mrg /* Returns true if statement S1 dominates statement S2.  A statement
1.1  mrg    dominates itself, and an S1 that is not in any basic block is treated
1.1  mrg    as dominating everything.  Within one basic block a PHI node comes
1.1  mrg    before every non-PHI statement, and no statement dominates a different
1.1  mrg    PHI node of the same block.  */
1.1  mrg
1.1  mrg bool
1.1  mrg stmt_dominates_stmt_p (gimple *s1, gimple *s2)
1.1  mrg {
1.1  mrg   basic_block bb1 = gimple_bb (s1);
1.1  mrg   basic_block bb2 = gimple_bb (s2);
1.1  mrg
1.1  mrg   if (s1 == s2 || !bb1)
1.1  mrg     return true;
1.1  mrg
1.1  mrg   /* Statements in different blocks: ask the dominator tree.  */
1.1  mrg   if (bb1 != bb2)
1.1  mrg     return dominated_by_p (CDI_DOMINATORS, bb2, bb1);
1.1  mrg
1.1  mrg   if (gimple_code (s2) == GIMPLE_PHI)
1.1  mrg     return false;
1.1  mrg   if (gimple_code (s1) == GIMPLE_PHI)
1.1  mrg     return true;
1.1  mrg
1.1  mrg   /* Both are ordinary statements of the same block: S1 dominates S2 iff
1.1  mrg      it is met before S2 when scanning the block from its start.  */
1.1  mrg   gimple_stmt_iterator gsi = gsi_start_bb (bb1);
1.1  mrg   while (gsi_stmt (gsi) != s2)
1.1  mrg     {
1.1  mrg       if (gsi_stmt (gsi) == s1)
1.1  mrg         return true;
1.1  mrg       gsi_next (&gsi);
1.1  mrg     }
1.1  mrg
1.1  mrg   return false;
1.1  mrg }
1.1  mrg
1.1  mrg /* Returns true when we can prove that the number of executions of
1.1  mrg    STMT in the loop is at most NITER, according to the bound on
1.1  mrg    the number of executions of the statement NITER_BOUND->stmt recorded in
1.1  mrg    NITER_BOUND and the relative position of NITER_BOUND->stmt and STMT.
1.1  mrg    The type of NITER must be unsigned.
1.1  mrg
1.1  mrg    ??? This code can become quite a CPU hog - we can have many bounds,
1.1  mrg    and a large basic block forces stmt_dominates_stmt_p to be queried
1.1  mrg    many times on it, so the whole thing is O(n^2) for a
1.1  mrg    scev_probably_wraps_p invocation (that can be done n times).
1.1  mrg
1.1  mrg    It would make more sense (and give better answers) to remember BB
1.1  mrg    bounds computed by discover_iteration_bound_by_body_walk.  */
1.1  mrg
1.1  mrg static bool
1.1  mrg n_of_executions_at_most (gimple *stmt,
1.1  mrg                          class nb_iter_bound *niter_bound,
1.1  mrg                          tree niter)
1.1  mrg {
1.1  mrg   tree nit_type = TREE_TYPE (niter);
1.1  mrg   gcc_assert (TYPE_UNSIGNED (nit_type));
1.1  mrg
1.1  mrg   /* A bound that does not even fit into NIT_TYPE cannot tell us that
1.1  mrg      the number of iterations is small.  */
1.1  mrg   widest_int limit = niter_bound->bound;
1.1  mrg   if (!wi::fits_to_tree_p (limit, nit_type))
1.1  mrg     return false;
1.1  mrg
1.1  mrg   /* NITER_BOUND->stmt is executed at most NITER_BOUND->bound + 1 times.
1.1  mrg      Hence:
1.1  mrg
1.1  mrg      -- if NITER_BOUND->is_exit is true, everything after it is executed
1.1  mrg         at most NITER_BOUND->bound times, so NITER >= bound suffices.
1.1  mrg
1.1  mrg      -- if NITER_BOUND->is_exit is false and executing STMT implies that
1.1  mrg         NITER_BOUND->stmt is executed in the same iteration, STMT is
1.1  mrg         executed at most NITER_BOUND->bound + 1 times, so NITER > bound
1.1  mrg         is needed.
1.1  mrg
1.1  mrg         If instead NITER_BOUND->stmt is always executed after STMT,
1.1  mrg         STMT is executed at most NITER_BOUND->bound + 2 times.  That is
1.1  mrg         concluded when both statements are in the same basic block,
1.1  mrg         STMT comes first and no statement with side effects lies in
1.1  mrg         between; the bound is then raised by one.  */
1.1  mrg   gimple *bound_stmt = niter_bound->stmt;
1.1  mrg   enum tree_code cmp;
1.1  mrg
1.1  mrg   if (niter_bound->is_exit)
1.1  mrg     {
1.1  mrg       if (stmt == bound_stmt
1.1  mrg           || !stmt_dominates_stmt_p (bound_stmt, stmt))
1.1  mrg         return false;
1.1  mrg       cmp = GE_EXPR;
1.1  mrg     }
1.1  mrg   else
1.1  mrg     {
1.1  mrg       if (!stmt_dominates_stmt_p (bound_stmt, stmt))
1.1  mrg         {
1.1  mrg           if (gimple_bb (stmt) != gimple_bb (bound_stmt)
1.1  mrg               || gimple_code (stmt) == GIMPLE_PHI
1.1  mrg               || gimple_code (bound_stmt) == GIMPLE_PHI)
1.1  mrg             return false;
1.1  mrg
1.1  mrg           /* Both statements share a block and the bounding statement
1.1  mrg              does not dominate STMT, so STMT appears first.  Still make
1.1  mrg              sure the loop cannot be terminated by a side effect in
1.1  mrg              between.  */
1.1  mrg           for (gimple_stmt_iterator gsi = gsi_for_stmt (stmt);
1.1  mrg                gsi_stmt (gsi) != bound_stmt; gsi_next (&gsi))
1.1  mrg             {
1.1  mrg               if (gimple_has_side_effects (gsi_stmt (gsi)))
1.1  mrg                 return false;
1.1  mrg             }
1.1  mrg
1.1  mrg           limit += 1;
1.1  mrg           if (limit == 0
1.1  mrg               || !wi::fits_to_tree_p (limit, nit_type))
1.1  mrg             return false;
1.1  mrg         }
1.1  mrg       cmp = GT_EXPR;
1.1  mrg     }
1.1  mrg
1.1  mrg   /* The claim is proven only if the comparison folds to a nonzero
1.1  mrg      constant.  */
1.1  mrg   tree folded = fold_binary (cmp, boolean_type_node,
1.1  mrg                              niter, wide_int_to_tree (nit_type, limit));
1.1  mrg   return folded && integer_nonzerop (folded);
1.1  mrg }
1.1  mrg
1.1  mrg /* Returns true if the arithmetics in TYPE can be assumed not to wrap:
1.1  mrg    TYPE is either an integral type with undefined overflow or a pointer
1.1  mrg    type.  */
1.1  mrg
1.1  mrg bool
1.1  mrg nowrap_type_p (tree type)
1.1  mrg {
1.1  mrg   return ((ANY_INTEGRAL_TYPE_P (type) && TYPE_OVERFLOW_UNDEFINED (type))
1.1  mrg           || POINTER_TYPE_P (type));
1.1  mrg }
1.1  mrg
1.1  mrg /* Return true if we can prove LOOP is exited before evolution of induction
1.1  mrg    variable {BASE, STEP} overflows with respect to its type bound.  AT_STMT,
1.1  mrg    if not NULL, is the statement whose number of executions is checked
1.1  mrg    against the per-statement bounds recorded for LOOP.  */
1.1  mrg
1.1  mrg static bool
1.1  mrg loop_exits_before_overflow (tree base, tree step,
1.1  mrg                             gimple *at_stmt, class loop *loop)
1.1  mrg {
1.1  mrg   tree type = TREE_TYPE (step);
1.1  mrg
1.1  mrg   /* Don't issue signed overflow warnings.  */
1.1  mrg   fold_defer_overflow_warnings ();
1.1  mrg
1.1  mrg   /* Compute, in the unsigned variant of TYPE, how many steps fit between
1.1  mrg      BASE and the extreme value of TYPE in the direction of STEP.  */
1.1  mrg   const bool negative_step = tree_int_cst_sign_bit (step);
1.1  mrg   tree unsigned_type = unsigned_type_for (type);
1.1  mrg   tree unsigned_base = fold_convert (unsigned_type, base);
1.1  mrg   tree delta, step_abs;
1.1  mrg
1.1  mrg   if (negative_step)
1.1  mrg     {
1.1  mrg       tree extreme = fold_convert (unsigned_type,
1.1  mrg                                    lower_bound_in_type (type, type));
1.1  mrg       delta = fold_build2 (MINUS_EXPR, unsigned_type, unsigned_base, extreme);
1.1  mrg       step_abs = fold_build1 (NEGATE_EXPR, unsigned_type,
1.1  mrg                               fold_convert (unsigned_type, step));
1.1  mrg     }
1.1  mrg   else
1.1  mrg     {
1.1  mrg       tree extreme = fold_convert (unsigned_type,
1.1  mrg                                    upper_bound_in_type (type, type));
1.1  mrg       delta = fold_build2 (MINUS_EXPR, unsigned_type, extreme, unsigned_base);
1.1  mrg       step_abs = fold_convert (unsigned_type, step);
1.1  mrg     }
1.1  mrg
1.1  mrg   tree valid_niter
1.1  mrg     = fold_build2 (FLOOR_DIV_EXPR, unsigned_type, delta, step_abs);
1.1  mrg
1.1  mrg   estimate_numbers_of_iterations (loop);
1.1  mrg
1.1  mrg   /* First try the upper bound on the latch executions of the whole loop,
1.1  mrg      then the bounds recorded for individual statements.  */
1.1  mrg   bool proven = false;
1.1  mrg   widest_int niter;
1.1  mrg   if (max_loop_iterations (loop, &niter)
1.1  mrg       && wi::fits_to_tree_p (niter, TREE_TYPE (valid_niter)))
1.1  mrg     {
1.1  mrg       tree cmp = fold_binary (GT_EXPR, boolean_type_node, valid_niter,
1.1  mrg                               wide_int_to_tree (TREE_TYPE (valid_niter),
1.1  mrg                                                 niter));
1.1  mrg       proven = cmp != NULL && integer_nonzerop (cmp);
1.1  mrg     }
1.1  mrg
1.1  mrg   if (!proven && at_stmt)
1.1  mrg     for (class nb_iter_bound *bound = loop->bounds; bound;
1.1  mrg          bound = bound->next)
1.1  mrg       if (n_of_executions_at_most (at_stmt, bound, valid_niter))
1.1  mrg         {
1.1  mrg           proven = true;
1.1  mrg           break;
1.1  mrg         }
1.1  mrg
1.1  mrg   fold_undefer_and_ignore_overflow_warnings ();
1.1  mrg   if (proven)
1.1  mrg     return true;
1.1  mrg
1.1  mrg   /* Try to prove loop is exited before {base, step} overflows with the
1.1  mrg      help of analyzed loop control IV.  This is done only for IVs with
1.1  mrg      constant step because otherwise we don't have the information.  */
1.1  mrg   if (TREE_CODE (step) != INTEGER_CST)
1.1  mrg     return false;
1.1  mrg
1.1  mrg   for (struct control_iv *civ = loop->control_ivs; civ; civ = civ->next)
1.1  mrg     {
1.1  mrg       tree civ_type = TREE_TYPE (civ->step);
1.1  mrg
1.1  mrg       /* Have to consider type difference because operand_equal_p ignores
1.1  mrg          that for constants.  */
1.1  mrg       if (TYPE_UNSIGNED (type) != TYPE_UNSIGNED (civ_type)
1.1  mrg           || element_precision (type) != element_precision (civ_type))
1.1  mrg         continue;
1.1  mrg
1.1  mrg       /* Only consider control IV with same step.  */
1.1  mrg       if (!operand_equal_p (step, civ->step, 0))
1.1  mrg         continue;
1.1  mrg
1.1  mrg       /* Done proving if this is a no-overflow control IV.  */
1.1  mrg       if (operand_equal_p (base, civ->base, 0))
1.1  mrg         return true;
1.1  mrg
1.1  mrg       /* Control IV is recorded after expanding simple operations, so
1.1  mrg          expand BASE and compare that too.  */
1.1  mrg       tree expanded_base = expand_simple_operations (base);
1.1  mrg       if (operand_equal_p (expanded_base, civ->base, 0))
1.1  mrg         return true;
1.1  mrg
1.1  mrg       /* If this is a before stepping control IV, in other words, we have
1.1  mrg
1.1  mrg            {civ_base, step} = {base + step, step}
1.1  mrg
1.1  mrg          Because civ {base + step, step} doesn't overflow during loop
1.1  mrg          iterations, {base, step} will not overflow if we can prove the
1.1  mrg          operation "base + step" does not overflow.  Specifically, we try
1.1  mrg          to prove below conditions are satisfied:
1.1  mrg
1.1  mrg            base <= UPPER_BOUND (type) - step  ;;step > 0
1.1  mrg            base >= LOWER_BOUND (type) - step  ;;step < 0
1.1  mrg
1.1  mrg          by proving the reverse conditions are false using loop's initial
1.1  mrg          condition.  */
1.1  mrg       enum tree_code plus_code
1.1  mrg         = POINTER_TYPE_P (TREE_TYPE (base)) ? POINTER_PLUS_EXPR : PLUS_EXPR;
1.1  mrg
1.1  mrg       tree stepped = fold_build2 (plus_code, TREE_TYPE (base), base, step);
1.1  mrg       tree expanded_stepped = fold_build2 (plus_code, TREE_TYPE (base),
1.1  mrg                                            expanded_base, step);
1.1  mrg       if (!operand_equal_p (stepped, civ->base, 0)
1.1  mrg           && !operand_equal_p (expanded_stepped, civ->base, 0))
1.1  mrg         continue;
1.1  mrg
1.1  mrg       enum tree_code reverse_code;
1.1  mrg       tree extreme;
1.1  mrg       if (negative_step)
1.1  mrg         {
1.1  mrg           reverse_code = LT_EXPR;
1.1  mrg           extreme = lower_bound_in_type (type, type);
1.1  mrg         }
1.1  mrg       else
1.1  mrg         {
1.1  mrg           reverse_code = GT_EXPR;
1.1  mrg           extreme = upper_bound_in_type (type, type);
1.1  mrg         }
1.1  mrg       extreme = fold_build2 (MINUS_EXPR, type, extreme, step);
1.1  mrg
1.1  mrg       tree reverse = fold_build2 (reverse_code, boolean_type_node,
1.1  mrg                                   base, extreme);
1.1  mrg       reverse = simplify_using_initial_conditions (loop, reverse);
1.1  mrg       if (integer_zerop (reverse))
1.1  mrg         return true;
1.1  mrg     }
1.1  mrg
1.1  mrg   return false;
1.1  mrg }
1.1  mrg
1.1  mrg /* VAR is scev variable whose evolution part is constant STEP, this function
1.1  mrg    proves that VAR can't overflow by using value range info.  If VAR's value
1.1  mrg    range is [MIN, MAX], it can be proven by:
1.1  mrg      MAX + step doesn't overflow    ; if step > 0
1.1  mrg    or
1.1  mrg      MIN + step doesn't underflow   ; if step < 0.
1.1  mrg
1.1  mrg    We can only do this if var is computed in every loop iteration, i.e, var's
1.1  mrg    definition has to dominate loop latch.  Consider below example:
1.1  mrg
1.1  mrg      {
1.1  mrg        unsigned int i;
1.1  mrg
1.1  mrg        <bb 3>:
1.1  mrg
1.1  mrg        <bb 4>:
1.1  mrg        # RANGE [0, 4294967294] NONZERO 65535
1.1  mrg        # i_21 = PHI <0(3), i_18(9)>
1.1  mrg        if (i_21 != 0)
1.1  mrg 	 goto <bb 6>;
1.1  mrg        else
1.1  mrg 	 goto <bb 8>;
1.1  mrg
1.1  mrg        <bb 6>:
1.1  mrg        # RANGE [0, 65533] NONZERO 65535
1.1  mrg        _6 = i_21 + 4294967295;
1.1  mrg        # RANGE [0, 65533] NONZERO 65535
1.1  mrg        _7 = (long unsigned int) _6;
1.1  mrg        # RANGE [0, 524264] NONZERO 524280
1.1  mrg        _8 = _7 * 8;
1.1  mrg        # PT = nonlocal escaped
1.1  mrg        _9 = a_14 + _8;
1.1  mrg        *_9 = 0;
1.1  mrg
1.1  mrg        <bb 8>:
1.1  mrg        # RANGE [1, 65535] NONZERO 65535
1.1  mrg        i_18 = i_21 + 1;
1.1  mrg        if (i_18 >= 65535)
1.1  mrg 	 goto <bb 10>;
1.1  mrg        else
1.1  mrg 	 goto <bb 9>;
1.1  mrg
1.1  mrg        <bb 9>:
1.1  mrg        goto <bb 4>;
1.1  mrg
1.1  mrg        <bb 10>:
1.1  mrg        return;
1.1  mrg      }
1.1  mrg
1.1  mrg    VAR _6 doesn't overflow only with pre-condition (i_21 != 0), here we
1.1  mrg    can't use _6 to prove no-overflow for _7.  In fact, var _7 takes value
1.1  mrg    sequence (4294967295, 0, 1, ..., 65533) in loop life time, rather than
1.1  mrg    (4294967295, 4294967296, ...).  */
1.1  mrg
1.1  mrg static bool
1.1  mrg scev_var_range_cant_overflow (tree var, tree step, class loop *loop)
1.1  mrg {
1.1  mrg   /* Returns true only when the value range of VAR proves that adding
1.1  mrg      STEP cannot leave the bounds of VAR's type; every "don't know"
1.1  mrg      case returns false.  VAR is expected to be an SSA name (its
1.1  mrg      defining statement is looked up below) and LOOP is the loop VAR
1.1  mrg      evolves in.  */
1.1  mrg
1.1  mrg   /* The proof needs a constant step and an integral variable.  */
1.1  mrg   if (TREE_CODE (step) != INTEGER_CST || !INTEGRAL_TYPE_P (TREE_TYPE (var)))
1.1  mrg     return false;
1.1  mrg
1.1  mrg   /* Check if VAR evaluates in every loop iteration.  It's not the case
1.1  mrg      if VAR is default definition or does not dominate loop's latch.  */
1.1  mrg   basic_block def_bb = gimple_bb (SSA_NAME_DEF_STMT (var));
1.1  mrg   if (!def_bb || !dominated_by_p (CDI_DOMINATORS, loop->latch, def_bb))
1.1  mrg     return false;
1.1  mrg
1.1  mrg   /* Only a proper [MIN, MAX] range is usable.  A query that reports
1.1  mrg      failure is treated like any other unusable range instead of
1.1  mrg      having its result silently dropped.  */
1.1  mrg   value_range r;
1.1  mrg   if (!get_range_query (cfun)->range_of_expr (r, var)
1.1  mrg       || r.kind () != VR_RANGE)
1.1  mrg     return false;
1.1  mrg
1.1  mrg   /* VAR is a scev whose evolution part is STEP and value range info
1.1  mrg      is [MIN, MAX], we can prove its no-overflowness by conditions:
1.1  mrg
1.1  mrg        type_MAX - MAX >= step   ; if step > 0
1.1  mrg        MIN - type_MIN >= |step| ; if step < 0.
1.1  mrg
1.1  mrg      Or VAR must take value outside of value range, which is not true.  */
1.1  mrg   tree type = TREE_TYPE (var);
1.1  mrg   wide_int step_wi = wi::to_wide (step);
1.1  mrg   wide_int diff;
1.1  mrg   if (tree_int_cst_sign_bit (step))
1.1  mrg     {
1.1  mrg       /* Negative step: measure the room below MIN and compare it with
1.1  mrg 	 the magnitude of the step.  */
1.1  mrg       diff = r.lower_bound () - wi::to_wide (lower_bound_in_type (type, type));
1.1  mrg       step_wi = - step_wi;
1.1  mrg     }
1.1  mrg   else
1.1  mrg     /* Positive step: measure the room above MAX.  */
1.1  mrg     diff = wi::to_wide (upper_bound_in_type (type, type)) - r.upper_bound ();
1.1  mrg
1.1  mrg   /* Both operands are non-negative distances, hence the unsigned
1.1  mrg      comparison.  */
1.1  mrg   return wi::geu_p (diff, step_wi);
1.1  mrg }
1.1  mrg
1.1  mrg /* Decide whether the induction variable BASE + STEP * I may wrap.
1.1  mrg    The answer is false only when the iv is known not to overflow, i.e.
1.1  mrg    when the number of iterations is small enough, given the step and
1.1  mrg    the initial value, for the evolution to stay within the bounds of
1.1  mrg    its type.  The answer is true when the iv is known to overflow or
1.1  mrg    when nothing can be proven either way.
1.1  mrg
1.1  mrg    When USE_OVERFLOW_SEMANTICS is true, the overflow rules of the
1.1  mrg    language may be relied upon (e.g., that signed arithmetic in C
1.1  mrg    does not overflow).
1.1  mrg
1.1  mrg    If VAR is an SSA name, false is also returned when value range
1.1  mrg    info proves that VAR does not overflow.  */
1.1  mrg
1.1  mrg bool
1.1  mrg scev_probably_wraps_p (tree var, tree base, tree step,
1.1  mrg 		       gimple *at_stmt, class loop *loop,
1.1  mrg 		       bool use_overflow_semantics)
1.1  mrg {
1.1  mrg   /* FIXME: We really need something like
1.1  mrg      http://gcc.gnu.org/ml/gcc-patches/2005-06/msg02025.html.
1.1  mrg
1.1  mrg      An earlier version recognized the following pattern, which is
1.1  mrg      common in address arithmetic:
1.1  mrg
1.1  mrg        D.1621_13 = (long unsigned intD.4) D.1620_12;
1.1  mrg        D.1622_14 = D.1621_13 * 8;
1.1  mrg        D.1623_15 = (doubleD.29 *) D.1622_14;
1.1  mrg
1.1  mrg      and concluded that the sequence for D_14 cannot wrap because it
1.1  mrg      feeds a memory access.  That conclusion is wrong: with
1.1  mrg      D_12 = (unsigned char) [254,+,1], D_14 takes the values
1.1  mrg      2032, 2040, 0, 8, ..., and the code is still legal.  */
1.1  mrg
1.1  mrg   /* Nothing can be proven about an unknown base or step.  */
1.1  mrg   const bool undetermined_p = (chrec_contains_undetermined (base)
1.1  mrg                                || chrec_contains_undetermined (step));
1.1  mrg   if (undetermined_p)
1.1  mrg     return true;
1.1  mrg
1.1  mrg   /* A zero step leaves the iv at BASE, so it cannot wrap.  */
1.1  mrg   if (integer_zerop (step))
1.1  mrg     return false;
1.1  mrg
1.1  mrg   /* Signed and pointer arithmetic that the language defines as
1.1  mrg      non-wrapping settles the question when we may rely on it.  */
1.1  mrg   if (use_overflow_semantics && nowrap_type_p (TREE_TYPE (base)))
1.1  mrg     return false;
1.1  mrg
1.1  mrg   /* The remaining proofs use estimates on the number of iterations,
1.1  mrg      which requires an upper bound on the absolute value of the step;
1.1  mrg      only a constant step provides one.  */
1.1  mrg   if (TREE_CODE (step) == INTEGER_CST)
1.1  mrg     {
1.1  mrg       /* First try value range info on VAR, then fall back to showing
1.1  mrg          that the loop exits before the iv could overflow.  */
1.1  mrg       const bool proven_p
1.1  mrg         = ((var != NULL_TREE
1.1  mrg             && TREE_CODE (var) == SSA_NAME
1.1  mrg             && scev_var_range_cant_overflow (var, step, loop))
1.1  mrg            || loop_exits_before_overflow (base, step, at_stmt, loop));
1.1  mrg
1.1  mrg       /* Without a proof we have to assume the iv may wrap.  */
1.1  mrg       return !proven_p;
1.1  mrg     }
1.1  mrg
1.1  mrg   return true;
1.1  mrg }
1.1  mrg
1.1  mrg /* Release everything recorded about the number of iterations of LOOP:
1.1  mrg    the cached iteration count is cleared, the estimate state is reset
1.1  mrg    to EST_NOT_COMPUTED, and the lists of bounds and of control ivs are
1.1  mrg    freed and left empty.  */
1.1  mrg
1.1  mrg void
1.1  mrg free_numbers_of_iterations_estimates (class loop *loop)
1.1  mrg {
1.1  mrg   loop->nb_iterations = NULL;
1.1  mrg   loop->estimate_state = EST_NOT_COMPUTED;
1.1  mrg
1.1  mrg   /* Detach the list of bounds from LOOP, then free it node by node.  */
1.1  mrg   class nb_iter_bound *pending_bound = loop->bounds;
1.1  mrg   loop->bounds = NULL;
1.1  mrg   while (pending_bound)
1.1  mrg     {
1.1  mrg       class nb_iter_bound *dead = pending_bound;
1.1  mrg       /* Read the link before the node is released.  */
1.1  mrg       pending_bound = pending_bound->next;
1.1  mrg       ggc_free (dead);
1.1  mrg     }
1.1  mrg
1.1  mrg   /* Likewise for the list of control ivs.  */
1.1  mrg   struct control_iv *pending_civ = loop->control_ivs;
1.1  mrg   loop->control_ivs = NULL;
1.1  mrg   while (pending_civ)
1.1  mrg     {
1.1  mrg       struct control_iv *dead = pending_civ;
1.1  mrg       pending_civ = pending_civ->next;
1.1  mrg       ggc_free (dead);
1.1  mrg     }
1.1  mrg }
1.1  mrg
1.1  mrg /* Release the recorded number-of-iterations information of every loop
1.1  mrg    of function FN, by applying the per-loop overload to each loop that
1.1  mrg    loops_list (FN, 0) enumerates.  */
1.1  mrg
1.1  mrg void
1.1  mrg free_numbers_of_iterations_estimates (function *fn)
1.1  mrg {
1.1  mrg   for (auto current : loops_list (fn, 0))
1.1  mrg     {
1.1  mrg       free_numbers_of_iterations_estimates (current);
1.1  mrg     }
1.1  mrg }
1.1  mrg
1.1  mrg /* Replace SSA name NAME by value VAL in the expressions stored in
1.1  mrg    LOOP.  Only the nb_iterations expression is rewritten here.  */
1.1  mrg
1.1  mrg void
1.1  mrg substitute_in_loop_info (class loop *loop, tree name, tree val)
1.1  mrg {
1.1  mrg   tree niter = loop->nb_iterations;
1.1  mrg   loop->nb_iterations = simplify_replace_tree (niter, name, val);
1.1  mrg }