contrib/gcc/tree-vectorizer.c

169689Skan/* Loop Vectorization
169689Skan   Copyright (C) 2003, 2004, 2005, 2006, 2007 Free Software Foundation, Inc.
169689Skan   Contributed by Dorit Naishlos <dorit@il.ibm.com>
169689Skan
169689SkanThis file is part of GCC.
169689Skan
169689SkanGCC is free software; you can redistribute it and/or modify it under
169689Skanthe terms of the GNU General Public License as published by the Free
169689SkanSoftware Foundation; either version 2, or (at your option) any later
169689Skanversion.
169689Skan
169689SkanGCC is distributed in the hope that it will be useful, but WITHOUT ANY
169689SkanWARRANTY; without even the implied warranty of MERCHANTABILITY or
169689SkanFITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
169689Skanfor more details.
169689Skan
169689SkanYou should have received a copy of the GNU General Public License
169689Skanalong with GCC; see the file COPYING.  If not, write to the Free
169689SkanSoftware Foundation, 51 Franklin Street, Fifth Floor, Boston, MA
169689Skan02110-1301, USA.  */
169689Skan
169689Skan/* Loop Vectorization Pass.
169689Skan
169689Skan   This pass tries to vectorize loops. This first implementation focuses on
169689Skan   simple inner-most loops, with no conditional control flow, and a set of
169689Skan   simple operations whose vector form can be expressed using existing
169689Skan   tree codes (PLUS, MULT etc).
169689Skan
169689Skan   For example, the vectorizer transforms the following simple loop:
169689Skan
169689Skan	short a[N]; short b[N]; short c[N]; int i;
169689Skan
169689Skan	for (i=0; i<N; i++){
169689Skan	  a[i] = b[i] + c[i];
169689Skan	}
169689Skan
169689Skan   as if it was manually vectorized by rewriting the source code into:
169689Skan
169689Skan	typedef int __attribute__((mode(V8HI))) v8hi;
169689Skan	short a[N];  short b[N]; short c[N];   int i;
169689Skan	v8hi *pa = (v8hi*)a, *pb = (v8hi*)b, *pc = (v8hi*)c;
169689Skan	v8hi va, vb, vc;
169689Skan
169689Skan	for (i=0; i<N/8; i++){
169689Skan	  vb = pb[i];
169689Skan	  vc = pc[i];
169689Skan	  va = vb + vc;
169689Skan	  pa[i] = va;
169689Skan	}
169689Skan
169689Skan	The main entry to this pass is vectorize_loops(), in which
169689Skan   the vectorizer applies a set of analyses on a given set of loops,
169689Skan   followed by the actual vectorization transformation for the loops that
169689Skan   had successfully passed the analysis phase.
169689Skan
169689Skan	Throughout this pass we make a distinction between two types of
169689Skan   data: scalars (which are represented by SSA_NAMES), and memory references
169689Skan   ("data-refs"). These two types of data require different handling both
169689Skan   during analysis and transformation. The types of data-refs that the
169689Skan   vectorizer currently supports are ARRAY_REFS whose base is an array DECL
169689Skan   (not a pointer), and INDIRECT_REFS through pointers; both array and pointer
169689Skan   accesses are required to have a simple (consecutive) access pattern.
169689Skan
169689Skan   Analysis phase:
169689Skan   ===============
169689Skan	The driver for the analysis phase is vect_analyze_loop_nest().
169689Skan   It applies a set of analyses, some of which rely on the scalar evolution
169689Skan   analyzer (scev) developed by Sebastian Pop.
169689Skan
169689Skan	During the analysis phase the vectorizer records some information
169689Skan   per stmt in a "stmt_vec_info" struct which is attached to each stmt in the
169689Skan   loop, as well as general information about the loop as a whole, which is
169689Skan   recorded in a "loop_vec_info" struct attached to each loop.
169689Skan
169689Skan   Transformation phase:
169689Skan   =====================
169689Skan	The loop transformation phase scans all the stmts in the loop, and
169689Skan   creates a vector stmt (or a sequence of stmts) for each scalar stmt S in
169689Skan   the loop that needs to be vectorized. It inserts the vector code sequence
169689Skan   just before the scalar stmt S, and records a pointer to the vector code
169689Skan   in STMT_VINFO_VEC_STMT (stmt_info) (stmt_info is the stmt_vec_info struct
169689Skan   attached to S). This pointer will be used for the vectorization of following
169689Skan   stmts which use the def of stmt S. Stmt S is removed if it writes to memory;
169689Skan   otherwise, we rely on dead code elimination for removing it.
169689Skan
169689Skan	For example, say stmt S1 was vectorized into stmt VS1:
169689Skan
169689Skan   VS1: vb = px[i];
169689Skan   S1:	b = x[i];    STMT_VINFO_VEC_STMT (stmt_info (S1)) = VS1
169689Skan   S2:  a = b;
169689Skan
169689Skan   To vectorize stmt S2, the vectorizer first finds the stmt that defines
169689Skan   the operand 'b' (S1), and gets the relevant vector def 'vb' from the
169689Skan   vector stmt VS1 pointed to by STMT_VINFO_VEC_STMT (stmt_info (S1)). The
169689Skan   resulting sequence would be:
169689Skan
169689Skan   VS1: vb = px[i];
169689Skan   S1:	b = x[i];	STMT_VINFO_VEC_STMT (stmt_info (S1)) = VS1
169689Skan   VS2: va = vb;
169689Skan   S2:  a = b;          STMT_VINFO_VEC_STMT (stmt_info (S2)) = VS2
169689Skan
169689Skan	Operands that are not SSA_NAMEs, are data-refs that appear in
169689Skan   load/store operations (like 'x[i]' in S1), and are handled differently.
169689Skan
169689Skan   Target modeling:
169689Skan   =================
169689Skan	Currently the only target specific information that is used is the
169689Skan   size of the vector (in bytes) - "UNITS_PER_SIMD_WORD". Targets that can
169689Skan   support different sizes of vectors, for now will need to specify one value
169689Skan   for "UNITS_PER_SIMD_WORD". More flexibility will be added in the future.
169689Skan
169689Skan	Since we only vectorize operations whose vector form can be
169689Skan   expressed using existing tree codes, to verify that an operation is
169689Skan   supported, the vectorizer checks the relevant optab at the relevant
169689Skan   machine_mode (e.g., add_optab->handlers[(int) V8HImode].insn_code). If
169689Skan   the value found is CODE_FOR_nothing, then there's no target support, and
169689Skan   we can't vectorize the stmt.
169689Skan
169689Skan   For additional information on this project see:
169689Skan   http://gcc.gnu.org/projects/tree-ssa/vectorization.html
169689Skan*/
169689Skan
169689Skan#include "config.h"
169689Skan#include "system.h"
169689Skan#include "coretypes.h"
169689Skan#include "tm.h"
169689Skan#include "ggc.h"
169689Skan#include "tree.h"
169689Skan#include "target.h"
169689Skan#include "rtl.h"
169689Skan#include "basic-block.h"
169689Skan#include "diagnostic.h"
169689Skan#include "tree-flow.h"
169689Skan#include "tree-dump.h"
169689Skan#include "timevar.h"
169689Skan#include "cfgloop.h"
169689Skan#include "cfglayout.h"
169689Skan#include "expr.h"
169689Skan#include "optabs.h"
169689Skan#include "params.h"
169689Skan#include "toplev.h"
169689Skan#include "tree-chrec.h"
169689Skan#include "tree-data-ref.h"
169689Skan#include "tree-scalar-evolution.h"
169689Skan#include "input.h"
169689Skan#include "tree-vectorizer.h"
169689Skan#include "tree-pass.h"
169689Skan
169689Skan/*************************************************************************
169689Skan  Simple Loop Peeling Utilities
169689Skan *************************************************************************/
169689Skanstatic struct loop *slpeel_tree_duplicate_loop_to_edge_cfg
169689Skan  (struct loop *, struct loops *, edge);
169689Skanstatic void slpeel_update_phis_for_duplicate_loop
169689Skan  (struct loop *, struct loop *, bool after);
169689Skanstatic void slpeel_update_phi_nodes_for_guard1
169689Skan  (edge, struct loop *, bool, basic_block *, bitmap *);
169689Skanstatic void slpeel_update_phi_nodes_for_guard2
169689Skan  (edge, struct loop *, bool, basic_block *);
169689Skanstatic edge slpeel_add_loop_guard (basic_block, tree, basic_block, basic_block);
169689Skan
169689Skanstatic void rename_use_op (use_operand_p);
169689Skanstatic void rename_variables_in_bb (basic_block);
169689Skanstatic void rename_variables_in_loop (struct loop *);
169689Skan
169689Skan/*************************************************************************
169689Skan  General Vectorization Utilities
169689Skan *************************************************************************/
169689Skanstatic void vect_set_dump_settings (void);
169689Skan
169689Skan/* vect_dump will be set to stderr or dump_file if exist.  */
169689SkanFILE *vect_dump;
169689Skan
169689Skan/* vect_verbosity_level set to an invalid value
169689Skan   to mark that it's uninitialized.  */
169689Skanenum verbosity_levels vect_verbosity_level = MAX_VERBOSITY_LEVEL;
169689Skan
169689Skan/* Number of loops, at the beginning of vectorization.  */
169689Skanunsigned int vect_loops_num;
169689Skan
169689Skan/* Loop location.  */
169689Skanstatic LOC vect_loop_location;
169689Skan
169689Skan/* Bitmap of virtual variables to be renamed.  */
169689Skanbitmap vect_vnames_to_rename;
169689Skan
169689Skan/*************************************************************************
169689Skan  Simple Loop Peeling Utilities
169689Skan
169689Skan  Utilities to support loop peeling for vectorization purposes.
169689Skan *************************************************************************/
169689Skan
169689Skan
169689Skan/* Renames the use *OP_P.  */
169689Skan
169689Skanstatic void
169689Skanrename_use_op (use_operand_p op_p)
169689Skan{
169689Skan  tree new_name;
169689Skan
169689Skan  if (TREE_CODE (USE_FROM_PTR (op_p)) != SSA_NAME)
169689Skan    return;
169689Skan
169689Skan  new_name = get_current_def (USE_FROM_PTR (op_p));
169689Skan
169689Skan  /* Something defined outside of the loop.  */
169689Skan  if (!new_name)
169689Skan    return;
169689Skan
169689Skan  /* An ordinary ssa name defined in the loop.  */
169689Skan
169689Skan  SET_USE (op_p, new_name);
169689Skan}
169689Skan
169689Skan
169689Skan/* Renames the variables in basic block BB.  */
169689Skan
169689Skanstatic void
169689Skanrename_variables_in_bb (basic_block bb)
169689Skan{
169689Skan  tree phi;
169689Skan  block_stmt_iterator bsi;
169689Skan  tree stmt;
169689Skan  use_operand_p use_p;
169689Skan  ssa_op_iter iter;
169689Skan  edge e;
169689Skan  edge_iterator ei;
169689Skan  struct loop *loop = bb->loop_father;
169689Skan
169689Skan  for (bsi = bsi_start (bb); !bsi_end_p (bsi); bsi_next (&bsi))
169689Skan    {
169689Skan      stmt = bsi_stmt (bsi);
169689Skan      FOR_EACH_SSA_USE_OPERAND (use_p, stmt, iter,
169689Skan				 (SSA_OP_ALL_USES | SSA_OP_ALL_KILLS))
169689Skan	rename_use_op (use_p);
169689Skan    }
169689Skan
169689Skan  FOR_EACH_EDGE (e, ei, bb->succs)
169689Skan    {
169689Skan      if (!flow_bb_inside_loop_p (loop, e->dest))
169689Skan	continue;
169689Skan      for (phi = phi_nodes (e->dest); phi; phi = PHI_CHAIN (phi))
169689Skan        rename_use_op (PHI_ARG_DEF_PTR_FROM_EDGE (phi, e));
169689Skan    }
169689Skan}
169689Skan
169689Skan
169689Skan/* Renames variables in new generated LOOP.  */
169689Skan
169689Skanstatic void
169689Skanrename_variables_in_loop (struct loop *loop)
169689Skan{
169689Skan  unsigned i;
169689Skan  basic_block *bbs;
169689Skan
169689Skan  bbs = get_loop_body (loop);
169689Skan
169689Skan  for (i = 0; i < loop->num_nodes; i++)
169689Skan    rename_variables_in_bb (bbs[i]);
169689Skan
169689Skan  free (bbs);
169689Skan}
169689Skan
169689Skan
169689Skan/* Update the PHI nodes of NEW_LOOP.
169689Skan
169689Skan   NEW_LOOP is a duplicate of ORIG_LOOP.
169689Skan   AFTER indicates whether NEW_LOOP executes before or after ORIG_LOOP:
169689Skan   AFTER is true if NEW_LOOP executes after ORIG_LOOP, and false if it
169689Skan   executes before it.  */
169689Skan
169689Skanstatic void
169689Skanslpeel_update_phis_for_duplicate_loop (struct loop *orig_loop,
169689Skan				       struct loop *new_loop, bool after)
169689Skan{
169689Skan  tree new_ssa_name;
169689Skan  tree phi_new, phi_orig;
169689Skan  tree def;
169689Skan  edge orig_loop_latch = loop_latch_edge (orig_loop);
169689Skan  edge orig_entry_e = loop_preheader_edge (orig_loop);
169689Skan  edge new_loop_exit_e = new_loop->single_exit;
169689Skan  edge new_loop_entry_e = loop_preheader_edge (new_loop);
169689Skan  edge entry_arg_e = (after ? orig_loop_latch : orig_entry_e);
169689Skan
169689Skan  /*
169689Skan     step 1. For each loop-header-phi:
169689Skan             Add the first phi argument for the phi in NEW_LOOP
169689Skan            (the one associated with the entry of NEW_LOOP)
169689Skan
169689Skan     step 2. For each loop-header-phi:
169689Skan             Add the second phi argument for the phi in NEW_LOOP
169689Skan            (the one associated with the latch of NEW_LOOP)
169689Skan
169689Skan     step 3. Update the phis in the successor block of NEW_LOOP.
169689Skan
169689Skan        case 1: NEW_LOOP was placed before ORIG_LOOP:
169689Skan                The successor block of NEW_LOOP is the header of ORIG_LOOP.
169689Skan                Updating the phis in the successor block can therefore be done
169689Skan                along with the scanning of the loop header phis, because the
169689Skan                header blocks of ORIG_LOOP and NEW_LOOP have exactly the same
169689Skan                phi nodes, organized in the same order.
169689Skan
169689Skan        case 2: NEW_LOOP was placed after ORIG_LOOP:
169689Skan                The successor block of NEW_LOOP is the original exit block of
169689Skan                ORIG_LOOP - the phis to be updated are the loop-closed-ssa phis.
169689Skan                We postpone updating these phis to a later stage (when
169689Skan                loop guards are added).
169689Skan   */
169689Skan
169689Skan
169689Skan  /* Scan the phis in the headers of the old and new loops
169689Skan     (they are organized in exactly the same order).  */
169689Skan
169689Skan  for (phi_new = phi_nodes (new_loop->header),
169689Skan       phi_orig = phi_nodes (orig_loop->header);
169689Skan       phi_new && phi_orig;
169689Skan       phi_new = PHI_CHAIN (phi_new), phi_orig = PHI_CHAIN (phi_orig))
169689Skan    {
169689Skan      /* step 1.  */
169689Skan      def = PHI_ARG_DEF_FROM_EDGE (phi_orig, entry_arg_e);
169689Skan      add_phi_arg (phi_new, def, new_loop_entry_e);
169689Skan
169689Skan      /* step 2.  */
169689Skan      def = PHI_ARG_DEF_FROM_EDGE (phi_orig, orig_loop_latch);
169689Skan      if (TREE_CODE (def) != SSA_NAME)
169689Skan        continue;
169689Skan
169689Skan      new_ssa_name = get_current_def (def);
169689Skan      if (!new_ssa_name)
169689Skan	{
169689Skan	  /* This only happens if there are no definitions
169689Skan	     inside the loop. use the phi_result in this case.  */
169689Skan	  new_ssa_name = PHI_RESULT (phi_new);
169689Skan	}
169689Skan
169689Skan      /* An ordinary ssa name defined in the loop.  */
169689Skan      add_phi_arg (phi_new, new_ssa_name, loop_latch_edge (new_loop));
169689Skan
169689Skan      /* step 3 (case 1).  */
169689Skan      if (!after)
169689Skan        {
169689Skan          gcc_assert (new_loop_exit_e == orig_entry_e);
169689Skan          SET_PHI_ARG_DEF (phi_orig,
169689Skan                           new_loop_exit_e->dest_idx,
169689Skan                           new_ssa_name);
169689Skan        }
169689Skan    }
169689Skan}
169689Skan
169689Skan
169689Skan/* Update PHI nodes for a guard of the LOOP.
169689Skan
169689Skan   Input:
169689Skan   - LOOP, GUARD_EDGE: LOOP is a loop for which we added guard code that
169689Skan        controls whether LOOP is to be executed.  GUARD_EDGE is the edge that
169689Skan        originates from the guard-bb, skips LOOP and reaches the (unique) exit
169689Skan        bb of LOOP.  This loop-exit-bb is an empty bb with one successor.
169689Skan        We denote this bb NEW_MERGE_BB because before the guard code was added
169689Skan        it had a single predecessor (the LOOP header), and now it became a merge
169689Skan        point of two paths - the path that ends with the LOOP exit-edge, and
169689Skan        the path that ends with GUARD_EDGE.
169689Skan   - NEW_EXIT_BB: New basic block that is added by this function between LOOP
169689Skan        and NEW_MERGE_BB. It is used to place loop-closed-ssa-form exit-phis.
169689Skan
169689Skan   ===> The CFG before the guard-code was added:
169689Skan        LOOP_header_bb:
169689Skan          loop_body
169689Skan          if (exit_loop) goto update_bb
169689Skan          else           goto LOOP_header_bb
169689Skan        update_bb:
169689Skan
169689Skan   ==> The CFG after the guard-code was added:
169689Skan        guard_bb:
169689Skan          if (LOOP_guard_condition) goto new_merge_bb
169689Skan          else                      goto LOOP_header_bb
169689Skan        LOOP_header_bb:
169689Skan          loop_body
169689Skan          if (exit_loop_condition) goto new_merge_bb
169689Skan          else                     goto LOOP_header_bb
169689Skan        new_merge_bb:
169689Skan          goto update_bb
169689Skan        update_bb:
169689Skan
169689Skan   ==> The CFG after this function:
169689Skan        guard_bb:
169689Skan          if (LOOP_guard_condition) goto new_merge_bb
169689Skan          else                      goto LOOP_header_bb
169689Skan        LOOP_header_bb:
169689Skan          loop_body
169689Skan          if (exit_loop_condition) goto new_exit_bb
169689Skan          else                     goto LOOP_header_bb
169689Skan        new_exit_bb:
169689Skan        new_merge_bb:
169689Skan          goto update_bb
169689Skan        update_bb:
169689Skan
169689Skan   This function:
169689Skan   1. creates and updates the relevant phi nodes to account for the new
169689Skan      incoming edge (GUARD_EDGE) into NEW_MERGE_BB. This involves:
169689Skan      1.1. Create phi nodes at NEW_MERGE_BB.
169689Skan      1.2. Update the phi nodes at the successor of NEW_MERGE_BB (denoted
169689Skan           UPDATE_BB).  UPDATE_BB was the exit-bb of LOOP before NEW_MERGE_BB
169689Skan           was added.
169689Skan   2. preserves loop-closed-ssa-form by creating the required phi nodes
169689Skan      at the exit of LOOP (i.e, in NEW_EXIT_BB).
169689Skan
169689Skan   There are two flavors to this function:
169689Skan
169689Skan   slpeel_update_phi_nodes_for_guard1:
169689Skan     Here the guard controls whether we enter or skip LOOP, where LOOP is a
169689Skan     prolog_loop (loop1 below), and the new phis created in NEW_MERGE_BB are
169689Skan     for variables that have phis in the loop header.
169689Skan
169689Skan   slpeel_update_phi_nodes_for_guard2:
169689Skan     Here the guard controls whether we enter or skip LOOP, where LOOP is an
169689Skan     epilog_loop (loop2 below), and the new phis created in NEW_MERGE_BB are
169689Skan     for variables that have phis in the loop exit.
169689Skan
169689Skan   I.E., the overall structure is:
169689Skan
169689Skan        loop1_preheader_bb:
169689Skan                guard1 (goto loop1/merge1_bb)
169689Skan        loop1
169689Skan        loop1_exit_bb:
169689Skan                guard2 (goto merge1_bb/merge2_bb)
169689Skan        merge1_bb
169689Skan        loop2
169689Skan        loop2_exit_bb
169689Skan        merge2_bb
169689Skan        next_bb
169689Skan
169689Skan   slpeel_update_phi_nodes_for_guard1 takes care of creating phis in
169689Skan   loop1_exit_bb and merge1_bb. These are entry phis (phis for the vars
169689Skan   that have phis in loop1->header).
169689Skan
169689Skan   slpeel_update_phi_nodes_for_guard2 takes care of creating phis in
169689Skan   loop2_exit_bb and merge2_bb. These are exit phis (phis for the vars
169689Skan   that have phis in next_bb). It also adds some of these phis to
169689Skan   loop1_exit_bb.
169689Skan
169689Skan   slpeel_update_phi_nodes_for_guard1 is always called before
169689Skan   slpeel_update_phi_nodes_for_guard2. They are both needed in order
169689Skan   to create correct data-flow and loop-closed-ssa-form.
169689Skan
169689Skan   Generally slpeel_update_phi_nodes_for_guard1 creates phis for variables
169689Skan   that change between iterations of a loop (and therefore have a phi-node
169689Skan   at the loop entry), whereas slpeel_update_phi_nodes_for_guard2 creates
169689Skan   phis for variables that are used out of the loop (and therefore have
169689Skan   loop-closed exit phis). Some variables may be both updated between
169689Skan   iterations and used after the loop. This is why in loop1_exit_bb we
169689Skan   may need both entry_phis (created by slpeel_update_phi_nodes_for_guard1)
169689Skan   and exit phis (created by slpeel_update_phi_nodes_for_guard2).
169689Skan
169689Skan   - IS_NEW_LOOP: if IS_NEW_LOOP is true, then LOOP is a newly created copy of
169689Skan     an original loop. i.e., we have:
169689Skan
169689Skan           orig_loop
169689Skan           guard_bb (goto LOOP/new_merge)
169689Skan           new_loop <-- LOOP
169689Skan           new_exit
169689Skan           new_merge
169689Skan           next_bb
169689Skan
169689Skan     If IS_NEW_LOOP is false, then LOOP is an original loop, in which case we
169689Skan     have:
169689Skan
169689Skan           new_loop
169689Skan           guard_bb (goto LOOP/new_merge)
169689Skan           orig_loop <-- LOOP
169689Skan           new_exit
169689Skan           new_merge
169689Skan           next_bb
169689Skan
169689Skan     The SSA names defined in the original loop have a current
169689Skan     reaching definition that records the corresponding new
169689Skan     ssa-name used in the new duplicated loop copy.
169689Skan  */
169689Skan
169689Skan/* Function slpeel_update_phi_nodes_for_guard1
169689Skan
169689Skan   Input:
169689Skan   - GUARD_EDGE, LOOP, IS_NEW_LOOP, NEW_EXIT_BB - as explained above.
169689Skan   - DEFS - a bitmap of ssa names to mark new names for which we recorded
169689Skan            information.
169689Skan
169689Skan   In the context of the overall structure, we have:
169689Skan
169689Skan        loop1_preheader_bb:
169689Skan                guard1 (goto loop1/merge1_bb)
169689SkanLOOP->  loop1
169689Skan        loop1_exit_bb:
169689Skan                guard2 (goto merge1_bb/merge2_bb)
169689Skan        merge1_bb
169689Skan        loop2
169689Skan        loop2_exit_bb
169689Skan        merge2_bb
169689Skan        next_bb
169689Skan
169689Skan   For each name updated between loop iterations (i.e - for each name that has
169689Skan   an entry (loop-header) phi in LOOP) we create a new phi in:
169689Skan   1. merge1_bb (to account for the edge from guard1)
169689Skan   2. loop1_exit_bb (an exit-phi to keep LOOP in loop-closed form)
169689Skan*/
169689Skan
169689Skanstatic void
169689Skanslpeel_update_phi_nodes_for_guard1 (edge guard_edge, struct loop *loop,
169689Skan                                    bool is_new_loop, basic_block *new_exit_bb,
169689Skan                                    bitmap *defs)
169689Skan{
169689Skan  tree orig_phi, new_phi;
169689Skan  tree update_phi, update_phi2;
169689Skan  tree guard_arg, loop_arg;
169689Skan  basic_block new_merge_bb = guard_edge->dest;
169689Skan  edge e = EDGE_SUCC (new_merge_bb, 0);
169689Skan  basic_block update_bb = e->dest;
169689Skan  basic_block orig_bb = loop->header;
169689Skan  edge new_exit_e;
169689Skan  tree current_new_name;
169689Skan  tree name;
169689Skan
169689Skan  /* Create new bb between loop and new_merge_bb.  */
169689Skan  *new_exit_bb = split_edge (loop->single_exit);
169689Skan  add_bb_to_loop (*new_exit_bb, loop->outer);
169689Skan
169689Skan  new_exit_e = EDGE_SUCC (*new_exit_bb, 0);
169689Skan
169689Skan  for (orig_phi = phi_nodes (orig_bb), update_phi = phi_nodes (update_bb);
169689Skan       orig_phi && update_phi;
169689Skan       orig_phi = PHI_CHAIN (orig_phi), update_phi = PHI_CHAIN (update_phi))
169689Skan    {
169689Skan      /* Virtual phi; Mark it for renaming. We actually want to call
169689Skan	 mar_sym_for_renaming, but since all ssa renaming datastructures
169689Skan	 are going to be freed before we get to call ssa_upate, we just
169689Skan	 record this name for now in a bitmap, and will mark it for
169689Skan	 renaming later.  */
169689Skan      name = PHI_RESULT (orig_phi);
169689Skan      if (!is_gimple_reg (SSA_NAME_VAR (name)))
169689Skan        bitmap_set_bit (vect_vnames_to_rename, SSA_NAME_VERSION (name));
169689Skan
169689Skan      /** 1. Handle new-merge-point phis  **/
169689Skan
169689Skan      /* 1.1. Generate new phi node in NEW_MERGE_BB:  */
169689Skan      new_phi = create_phi_node (SSA_NAME_VAR (PHI_RESULT (orig_phi)),
169689Skan                                 new_merge_bb);
169689Skan
169689Skan      /* 1.2. NEW_MERGE_BB has two incoming edges: GUARD_EDGE and the exit-edge
169689Skan            of LOOP. Set the two phi args in NEW_PHI for these edges:  */
169689Skan      loop_arg = PHI_ARG_DEF_FROM_EDGE (orig_phi, EDGE_SUCC (loop->latch, 0));
169689Skan      guard_arg = PHI_ARG_DEF_FROM_EDGE (orig_phi, loop_preheader_edge (loop));
169689Skan
169689Skan      add_phi_arg (new_phi, loop_arg, new_exit_e);
169689Skan      add_phi_arg (new_phi, guard_arg, guard_edge);
169689Skan
169689Skan      /* 1.3. Update phi in successor block.  */
169689Skan      gcc_assert (PHI_ARG_DEF_FROM_EDGE (update_phi, e) == loop_arg
169689Skan                  || PHI_ARG_DEF_FROM_EDGE (update_phi, e) == guard_arg);
169689Skan      SET_PHI_ARG_DEF (update_phi, e->dest_idx, PHI_RESULT (new_phi));
169689Skan      update_phi2 = new_phi;
169689Skan
169689Skan
169689Skan      /** 2. Handle loop-closed-ssa-form phis  **/
169689Skan
169689Skan      /* 2.1. Generate new phi node in NEW_EXIT_BB:  */
169689Skan      new_phi = create_phi_node (SSA_NAME_VAR (PHI_RESULT (orig_phi)),
169689Skan                                 *new_exit_bb);
169689Skan
169689Skan      /* 2.2. NEW_EXIT_BB has one incoming edge: the exit-edge of the loop.  */
169689Skan      add_phi_arg (new_phi, loop_arg, loop->single_exit);
169689Skan
169689Skan      /* 2.3. Update phi in successor of NEW_EXIT_BB:  */
169689Skan      gcc_assert (PHI_ARG_DEF_FROM_EDGE (update_phi2, new_exit_e) == loop_arg);
169689Skan      SET_PHI_ARG_DEF (update_phi2, new_exit_e->dest_idx, PHI_RESULT (new_phi));
169689Skan
169689Skan      /* 2.4. Record the newly created name with set_current_def.
169689Skan         We want to find a name such that
169689Skan                name = get_current_def (orig_loop_name)
169689Skan         and to set its current definition as follows:
169689Skan                set_current_def (name, new_phi_name)
169689Skan
169689Skan         If LOOP is a new loop then loop_arg is already the name we're
169689Skan         looking for. If LOOP is the original loop, then loop_arg is
169689Skan         the orig_loop_name and the relevant name is recorded in its
169689Skan         current reaching definition.  */
169689Skan      if (is_new_loop)
169689Skan        current_new_name = loop_arg;
169689Skan      else
169689Skan        {
169689Skan          current_new_name = get_current_def (loop_arg);
169689Skan	  /* current_def is not available only if the variable does not
169689Skan	     change inside the loop, in which case we also don't care
169689Skan	     about recording a current_def for it because we won't be
169689Skan	     trying to create loop-exit-phis for it.  */
169689Skan	  if (!current_new_name)
169689Skan	    continue;
169689Skan        }
169689Skan      gcc_assert (get_current_def (current_new_name) == NULL_TREE);
169689Skan
169689Skan      set_current_def (current_new_name, PHI_RESULT (new_phi));
169689Skan      bitmap_set_bit (*defs, SSA_NAME_VERSION (current_new_name));
169689Skan    }
169689Skan
169689Skan  set_phi_nodes (new_merge_bb, phi_reverse (phi_nodes (new_merge_bb)));
169689Skan}
169689Skan
169689Skan
169689Skan/* Function slpeel_update_phi_nodes_for_guard2
169689Skan
169689Skan   Input:
169689Skan   - GUARD_EDGE, LOOP, IS_NEW_LOOP, NEW_EXIT_BB - as explained above.
169689Skan
169689Skan   In the context of the overall structure, we have:
169689Skan
169689Skan        loop1_preheader_bb:
169689Skan                guard1 (goto loop1/merge1_bb)
169689Skan        loop1
169689Skan        loop1_exit_bb:
169689Skan                guard2 (goto merge1_bb/merge2_bb)
169689Skan        merge1_bb
169689SkanLOOP->  loop2
169689Skan        loop2_exit_bb
169689Skan        merge2_bb
169689Skan        next_bb
169689Skan
169689Skan   For each name used outside the loop (i.e - for each name that has an exit
169689Skan   phi in next_bb) we create a new phi in:
169689Skan   1. merge2_bb (to account for the edge from guard_bb)
169689Skan   2. loop2_exit_bb (an exit-phi to keep LOOP in loop-closed form)
169689Skan   3. guard2 bb (an exit phi to keep the preceding loop in loop-closed form),
169689Skan      if needed (if it wasn't handled by slpeel_update_phi_nodes_for_guard1).
169689Skan*/
169689Skan
169689Skanstatic void
169689Skanslpeel_update_phi_nodes_for_guard2 (edge guard_edge, struct loop *loop,
169689Skan                                    bool is_new_loop, basic_block *new_exit_bb)
169689Skan{
169689Skan  tree orig_phi, new_phi;
169689Skan  tree update_phi, update_phi2;
169689Skan  tree guard_arg, loop_arg;
169689Skan  basic_block new_merge_bb = guard_edge->dest;
169689Skan  edge e = EDGE_SUCC (new_merge_bb, 0);
169689Skan  basic_block update_bb = e->dest;
169689Skan  edge new_exit_e;
169689Skan  tree orig_def, orig_def_new_name;
169689Skan  tree new_name, new_name2;
169689Skan  tree arg;
169689Skan
169689Skan  /* Create new bb between loop and new_merge_bb.  */
169689Skan  *new_exit_bb = split_edge (loop->single_exit);
169689Skan  add_bb_to_loop (*new_exit_bb, loop->outer);
169689Skan
169689Skan  new_exit_e = EDGE_SUCC (*new_exit_bb, 0);
169689Skan
169689Skan  for (update_phi = phi_nodes (update_bb); update_phi;
169689Skan       update_phi = PHI_CHAIN (update_phi))
169689Skan    {
169689Skan      orig_phi = update_phi;
169689Skan      orig_def = PHI_ARG_DEF_FROM_EDGE (orig_phi, e);
169689Skan      /* This loop-closed-phi actually doesn't represent a use
169689Skan         out of the loop - the phi arg is a constant.  */
169689Skan      if (TREE_CODE (orig_def) != SSA_NAME)
169689Skan        continue;
169689Skan      orig_def_new_name = get_current_def (orig_def);
169689Skan      arg = NULL_TREE;
169689Skan
169689Skan      /** 1. Handle new-merge-point phis  **/
169689Skan
169689Skan      /* 1.1. Generate new phi node in NEW_MERGE_BB:  */
169689Skan      new_phi = create_phi_node (SSA_NAME_VAR (PHI_RESULT (orig_phi)),
169689Skan                                 new_merge_bb);
169689Skan
169689Skan      /* 1.2. NEW_MERGE_BB has two incoming edges: GUARD_EDGE and the exit-edge
169689Skan            of LOOP. Set the two PHI args in NEW_PHI for these edges:  */
169689Skan      new_name = orig_def;
169689Skan      new_name2 = NULL_TREE;
169689Skan      if (orig_def_new_name)
169689Skan        {
169689Skan          new_name = orig_def_new_name;
169689Skan	  /* Some variables have both loop-entry-phis and loop-exit-phis.
169689Skan	     Such variables were given yet newer names by phis placed in
169689Skan	     guard_bb by slpeel_update_phi_nodes_for_guard1. I.e:
169689Skan	     new_name2 = get_current_def (get_current_def (orig_name)).  */
169689Skan          new_name2 = get_current_def (new_name);
169689Skan        }
169689Skan
169689Skan      if (is_new_loop)
169689Skan        {
169689Skan          guard_arg = orig_def;
169689Skan          loop_arg = new_name;
169689Skan        }
169689Skan      else
169689Skan        {
169689Skan          guard_arg = new_name;
169689Skan          loop_arg = orig_def;
169689Skan        }
169689Skan      if (new_name2)
169689Skan        guard_arg = new_name2;
169689Skan
169689Skan      add_phi_arg (new_phi, loop_arg, new_exit_e);
169689Skan      add_phi_arg (new_phi, guard_arg, guard_edge);
169689Skan
169689Skan      /* 1.3. Update phi in successor block.  */
169689Skan      gcc_assert (PHI_ARG_DEF_FROM_EDGE (update_phi, e) == orig_def);
169689Skan      SET_PHI_ARG_DEF (update_phi, e->dest_idx, PHI_RESULT (new_phi));
169689Skan      update_phi2 = new_phi;
169689Skan
169689Skan
169689Skan      /** 2. Handle loop-closed-ssa-form phis  **/
169689Skan
169689Skan      /* 2.1. Generate new phi node in NEW_EXIT_BB:  */
169689Skan      new_phi = create_phi_node (SSA_NAME_VAR (PHI_RESULT (orig_phi)),
169689Skan                                 *new_exit_bb);
169689Skan
169689Skan      /* 2.2. NEW_EXIT_BB has one incoming edge: the exit-edge of the loop.  */
169689Skan      add_phi_arg (new_phi, loop_arg, loop->single_exit);
169689Skan
169689Skan      /* 2.3. Update phi in successor of NEW_EXIT_BB:  */
169689Skan      gcc_assert (PHI_ARG_DEF_FROM_EDGE (update_phi2, new_exit_e) == loop_arg);
169689Skan      SET_PHI_ARG_DEF (update_phi2, new_exit_e->dest_idx, PHI_RESULT (new_phi));
169689Skan
169689Skan
169689Skan      /** 3. Handle loop-closed-ssa-form phis for first loop  **/
169689Skan
169689Skan      /* 3.1. Find the relevant names that need an exit-phi in
169689Skan	 GUARD_BB, i.e. names for which
169689Skan	 slpeel_update_phi_nodes_for_guard1 had not already created a
169689Skan	 phi node. This is the case for names that are used outside
169689Skan	 the loop (and therefore need an exit phi) but are not updated
169689Skan	 across loop iterations (and therefore don't have a
169689Skan	 loop-header-phi).
169689Skan
169689Skan	 slpeel_update_phi_nodes_for_guard1 is responsible for
169689Skan	 creating loop-exit phis in GUARD_BB for names that have a
169689Skan	 loop-header-phi.  When such a phi is created we also record
169689Skan	 the new name in its current definition.  If this new name
169689Skan	 exists, then guard_arg was set to this new name (see 1.2
169689Skan	 above).  Therefore, if guard_arg is not this new name, this
169689Skan	 is an indication that an exit-phi in GUARD_BB was not yet
169689Skan	 created, so we take care of it here.  */
169689Skan      if (guard_arg == new_name2)
169689Skan	continue;
169689Skan      arg = guard_arg;
169689Skan
169689Skan      /* 3.2. Generate new phi node in GUARD_BB:  */
169689Skan      new_phi = create_phi_node (SSA_NAME_VAR (PHI_RESULT (orig_phi)),
169689Skan                                 guard_edge->src);
169689Skan
169689Skan      /* 3.3. GUARD_BB has one incoming edge:  */
169689Skan      gcc_assert (EDGE_COUNT (guard_edge->src->preds) == 1);
169689Skan      add_phi_arg (new_phi, arg, EDGE_PRED (guard_edge->src, 0));
169689Skan
169689Skan      /* 3.4. Update phi in successor of GUARD_BB:  */
169689Skan      gcc_assert (PHI_ARG_DEF_FROM_EDGE (update_phi2, guard_edge)
169689Skan                                                                == guard_arg);
169689Skan      SET_PHI_ARG_DEF (update_phi2, guard_edge->dest_idx, PHI_RESULT (new_phi));
169689Skan    }
169689Skan
169689Skan  set_phi_nodes (new_merge_bb, phi_reverse (phi_nodes (new_merge_bb)));
169689Skan}
169689Skan
169689Skan
169689Skan/* Make the LOOP iterate NITERS times. This is done by adding a new IV
169689Skan   that starts at zero, increases by one and its limit is NITERS.
169689Skan
169689Skan   Assumption: the exit-condition of LOOP is the last stmt in the loop.  */
169689Skan
169689Skanvoid
169689Skanslpeel_make_loop_iterate_ntimes (struct loop *loop, tree niters)
169689Skan{
169689Skan  tree indx_before_incr, indx_after_incr, cond_stmt, cond;
169689Skan  tree orig_cond;
169689Skan  edge exit_edge = loop->single_exit;
169689Skan  block_stmt_iterator loop_cond_bsi;
169689Skan  block_stmt_iterator incr_bsi;
169689Skan  bool insert_after;
169689Skan  tree begin_label = tree_block_label (loop->latch);
169689Skan  tree exit_label = tree_block_label (loop->single_exit->dest);
169689Skan  tree init = build_int_cst (TREE_TYPE (niters), 0);
169689Skan  tree step = build_int_cst (TREE_TYPE (niters), 1);
169689Skan  tree then_label;
169689Skan  tree else_label;
169689Skan  LOC loop_loc;
169689Skan
169689Skan  orig_cond = get_loop_exit_condition (loop);
169689Skan  gcc_assert (orig_cond);
169689Skan  loop_cond_bsi = bsi_for_stmt (orig_cond);
169689Skan
169689Skan  standard_iv_increment_position (loop, &incr_bsi, &insert_after);
169689Skan  create_iv (init, step, NULL_TREE, loop,
169689Skan             &incr_bsi, insert_after, &indx_before_incr, &indx_after_incr);
169689Skan
169689Skan  if (exit_edge->flags & EDGE_TRUE_VALUE) /* 'then' edge exits the loop.  */
169689Skan    {
169689Skan      cond = build2 (GE_EXPR, boolean_type_node, indx_after_incr, niters);
169689Skan      then_label = build1 (GOTO_EXPR, void_type_node, exit_label);
169689Skan      else_label = build1 (GOTO_EXPR, void_type_node, begin_label);
169689Skan    }
169689Skan  else /* 'then' edge loops back.  */
169689Skan    {
169689Skan      cond = build2 (LT_EXPR, boolean_type_node, indx_after_incr, niters);
169689Skan      then_label = build1 (GOTO_EXPR, void_type_node, begin_label);
169689Skan      else_label = build1 (GOTO_EXPR, void_type_node, exit_label);
169689Skan    }
169689Skan
169689Skan  cond_stmt = build3 (COND_EXPR, TREE_TYPE (orig_cond), cond,
169689Skan		     then_label, else_label);
169689Skan  bsi_insert_before (&loop_cond_bsi, cond_stmt, BSI_SAME_STMT);
169689Skan
169689Skan  /* Remove old loop exit test:  */
169689Skan  bsi_remove (&loop_cond_bsi, true);
169689Skan
169689Skan  loop_loc = find_loop_location (loop);
169689Skan  if (dump_file && (dump_flags & TDF_DETAILS))
169689Skan    {
169689Skan      if (loop_loc != UNKNOWN_LOC)
169689Skan        fprintf (dump_file, "\nloop at %s:%d: ",
169689Skan                 LOC_FILE (loop_loc), LOC_LINE (loop_loc));
169689Skan      print_generic_expr (dump_file, cond_stmt, TDF_SLIM);
169689Skan    }
169689Skan
169689Skan  loop->nb_iterations = niters;
169689Skan}
169689Skan
169689Skan
169689Skan/* Given LOOP this function generates a new copy of it and puts it
169689Skan   on E which is either the entry or exit of LOOP.  */
169689Skan
169689Skanstatic struct loop *
169689Skanslpeel_tree_duplicate_loop_to_edge_cfg (struct loop *loop, struct loops *loops,
169689Skan					edge e)
169689Skan{
169689Skan  struct loop *new_loop;
169689Skan  basic_block *new_bbs, *bbs;
169689Skan  bool at_exit;
169689Skan  bool was_imm_dom;
169689Skan  basic_block exit_dest;
169689Skan  tree phi, phi_arg;
169689Skan
169689Skan  at_exit = (e == loop->single_exit);
169689Skan  if (!at_exit && e != loop_preheader_edge (loop))
169689Skan    return NULL;
169689Skan
169689Skan  bbs = get_loop_body (loop);
169689Skan
169689Skan  /* Check whether duplication is possible.  */
169689Skan  if (!can_copy_bbs_p (bbs, loop->num_nodes))
169689Skan    {
169689Skan      free (bbs);
169689Skan      return NULL;
169689Skan    }
169689Skan
169689Skan  /* Generate new loop structure.  */
169689Skan  new_loop = duplicate_loop (loops, loop, loop->outer);
169689Skan  if (!new_loop)
169689Skan    {
169689Skan      free (bbs);
169689Skan      return NULL;
169689Skan    }
169689Skan
169689Skan  exit_dest = loop->single_exit->dest;
169689Skan  was_imm_dom = (get_immediate_dominator (CDI_DOMINATORS,
169689Skan					  exit_dest) == loop->header ?
169689Skan		 true : false);
169689Skan
169689Skan  new_bbs = XNEWVEC (basic_block, loop->num_nodes);
169689Skan
169689Skan  copy_bbs (bbs, loop->num_nodes, new_bbs,
169689Skan	    &loop->single_exit, 1, &new_loop->single_exit, NULL,
169689Skan	    e->src);
169689Skan
169689Skan  /* Duplicating phi args at exit bbs as coming
169689Skan     also from exit of duplicated loop.  */
169689Skan  for (phi = phi_nodes (exit_dest); phi; phi = PHI_CHAIN (phi))
169689Skan    {
169689Skan      phi_arg = PHI_ARG_DEF_FROM_EDGE (phi, loop->single_exit);
169689Skan      if (phi_arg)
169689Skan	{
169689Skan	  edge new_loop_exit_edge;
169689Skan
169689Skan	  if (EDGE_SUCC (new_loop->header, 0)->dest == new_loop->latch)
169689Skan	    new_loop_exit_edge = EDGE_SUCC (new_loop->header, 1);
169689Skan	  else
169689Skan	    new_loop_exit_edge = EDGE_SUCC (new_loop->header, 0);
169689Skan
169689Skan	  add_phi_arg (phi, phi_arg, new_loop_exit_edge);
169689Skan	}
169689Skan    }
169689Skan
169689Skan  if (at_exit) /* Add the loop copy at exit.  */
169689Skan    {
169689Skan      redirect_edge_and_branch_force (e, new_loop->header);
169689Skan      set_immediate_dominator (CDI_DOMINATORS, new_loop->header, e->src);
169689Skan      if (was_imm_dom)
169689Skan	set_immediate_dominator (CDI_DOMINATORS, exit_dest, new_loop->header);
169689Skan    }
169689Skan  else /* Add the copy at entry.  */
169689Skan    {
169689Skan      edge new_exit_e;
169689Skan      edge entry_e = loop_preheader_edge (loop);
169689Skan      basic_block preheader = entry_e->src;
169689Skan
169689Skan      if (!flow_bb_inside_loop_p (new_loop,
169689Skan				  EDGE_SUCC (new_loop->header, 0)->dest))
169689Skan        new_exit_e = EDGE_SUCC (new_loop->header, 0);
169689Skan      else
169689Skan	new_exit_e = EDGE_SUCC (new_loop->header, 1);
169689Skan
169689Skan      redirect_edge_and_branch_force (new_exit_e, loop->header);
169689Skan      set_immediate_dominator (CDI_DOMINATORS, loop->header,
169689Skan			       new_exit_e->src);
169689Skan
169689Skan      /* We have to add phi args to the loop->header here as coming
169689Skan	 from new_exit_e edge.  */
169689Skan      for (phi = phi_nodes (loop->header); phi; phi = PHI_CHAIN (phi))
169689Skan	{
169689Skan	  phi_arg = PHI_ARG_DEF_FROM_EDGE (phi, entry_e);
169689Skan	  if (phi_arg)
169689Skan	    add_phi_arg (phi, phi_arg, new_exit_e);
169689Skan	}
169689Skan
169689Skan      redirect_edge_and_branch_force (entry_e, new_loop->header);
169689Skan      set_immediate_dominator (CDI_DOMINATORS, new_loop->header, preheader);
169689Skan    }
169689Skan
169689Skan  free (new_bbs);
169689Skan  free (bbs);
169689Skan
169689Skan  return new_loop;
169689Skan}
169689Skan
169689Skan
169689Skan/* Given the condition statement COND, put it as the last statement
169689Skan   of GUARD_BB; EXIT_BB is the basic block to skip the loop;
169689Skan   Assumes that this is the single exit of the guarded loop.
169689Skan   Returns the skip edge.  */
169689Skan
169689Skanstatic edge
169689Skanslpeel_add_loop_guard (basic_block guard_bb, tree cond, basic_block exit_bb,
169689Skan		        basic_block dom_bb)
169689Skan{
169689Skan  block_stmt_iterator bsi;
169689Skan  edge new_e, enter_e;
169689Skan  tree cond_stmt, then_label, else_label;
169689Skan
169689Skan  enter_e = EDGE_SUCC (guard_bb, 0);
169689Skan  enter_e->flags &= ~EDGE_FALLTHRU;
169689Skan  enter_e->flags |= EDGE_FALSE_VALUE;
169689Skan  bsi = bsi_last (guard_bb);
169689Skan
169689Skan  then_label = build1 (GOTO_EXPR, void_type_node,
169689Skan                       tree_block_label (exit_bb));
169689Skan  else_label = build1 (GOTO_EXPR, void_type_node,
169689Skan                       tree_block_label (enter_e->dest));
169689Skan  cond_stmt = build3 (COND_EXPR, void_type_node, cond,
169689Skan   		     then_label, else_label);
169689Skan  bsi_insert_after (&bsi, cond_stmt, BSI_NEW_STMT);
169689Skan  /* Add new edge to connect guard block to the merge/loop-exit block.  */
169689Skan  new_e = make_edge (guard_bb, exit_bb, EDGE_TRUE_VALUE);
169689Skan  set_immediate_dominator (CDI_DOMINATORS, exit_bb, dom_bb);
169689Skan  return new_e;
169689Skan}
169689Skan
169689Skan
169689Skan/* This function verifies that the following restrictions apply to LOOP:
169689Skan   (1) it is innermost
169689Skan   (2) it consists of exactly 2 basic blocks - header, and an empty latch.
169689Skan   (3) it is single entry, single exit
169689Skan   (4) its exit condition is the last stmt in the header
169689Skan   (5) E is the entry/exit edge of LOOP.
169689Skan */
169689Skan
169689Skanbool
169689Skanslpeel_can_duplicate_loop_p (struct loop *loop, edge e)
169689Skan{
169689Skan  edge exit_e = loop->single_exit;
169689Skan  edge entry_e = loop_preheader_edge (loop);
169689Skan  tree orig_cond = get_loop_exit_condition (loop);
169689Skan  block_stmt_iterator loop_exit_bsi = bsi_last (exit_e->src);
169689Skan
169689Skan  if (need_ssa_update_p ())
169689Skan    return false;
169689Skan
169689Skan  if (loop->inner
169689Skan      /* All loops have an outer scope; the only case loop->outer is NULL is for
169689Skan         the function itself.  */
169689Skan      || !loop->outer
169689Skan      || loop->num_nodes != 2
169689Skan      || !empty_block_p (loop->latch)
169689Skan      || !loop->single_exit
169689Skan      /* Verify that new loop exit condition can be trivially modified.  */
169689Skan      || (!orig_cond || orig_cond != bsi_stmt (loop_exit_bsi))
169689Skan      || (e != exit_e && e != entry_e))
169689Skan    return false;
169689Skan
169689Skan  return true;
169689Skan}
169689Skan
#ifdef ENABLE_CHECKING
/* Sanity-check the CFG around FIRST_LOOP and SECOND_LOOP after peeling.
   Only compiled when ENABLE_CHECKING is defined; violations trigger
   gcc_assert.  */
void
slpeel_verify_cfg_after_peeling (struct loop *first_loop,
                                 struct loop *second_loop)
{
  basic_block first_exit_bb = first_loop->single_exit->dest;
  basic_block second_preheader_bb = loop_preheader_edge (second_loop)->src;
  basic_block first_preheader_bb = loop_preheader_edge (first_loop)->src;
  basic_block pred0, pred1;

  /* The guard deciding whether second_loop is executed or skipped lives
     in the exit block of first_loop.  That block therefore has two
     successors: the preheader of second_loop and a block located after
     second_loop.  */
  gcc_assert (EDGE_COUNT (first_exit_bb->succs) == 2);

  /* 1. Verify that one of the successors of the exit block of first_loop
        is the preheader of second_loop.

     The preheader of second_loop is expected to have exactly two
     predecessors, in either order: the exit block of first_loop and the
     block that precedes first_loop.  */
  gcc_assert (EDGE_COUNT (second_preheader_bb->preds) == 2);

  pred0 = EDGE_PRED (second_preheader_bb, 0)->src;
  pred1 = EDGE_PRED (second_preheader_bb, 1)->src;
  gcc_assert ((pred0 == first_exit_bb && pred1 == first_preheader_bb)
              || (pred1 == first_exit_bb && pred0 == first_preheader_bb));

  /* 2. Verify that the other successor of the exit block of first_loop
        is located after second_loop.  */
  /* TODO */
}
#endif
169689Skan
169689Skan/* Function slpeel_tree_peel_loop_to_edge.
169689Skan
169689Skan   Peel the first (last) iterations of LOOP into a new prolog (epilog) loop
169689Skan   that is placed on the entry (exit) edge E of LOOP. After this transformation
169689Skan   we have two loops one after the other - first-loop iterates FIRST_NITERS
169689Skan   times, and second-loop iterates the remainder NITERS - FIRST_NITERS times.
169689Skan
169689Skan   Input:
169689Skan   - LOOP: the loop to be peeled.
169689Skan   - E: the exit or entry edge of LOOP.
169689Skan        If it is the entry edge, we peel the first iterations of LOOP. In this
169689Skan        case first-loop is LOOP, and second-loop is the newly created loop.
169689Skan        If it is the exit edge, we peel the last iterations of LOOP. In this
169689Skan        case, first-loop is the newly created loop, and second-loop is LOOP.
169689Skan   - NITERS: the number of iterations that LOOP iterates.
169689Skan   - FIRST_NITERS: the number of iterations that the first-loop should iterate.
169689Skan   - UPDATE_FIRST_LOOP_COUNT:  specified whether this function is responsible
169689Skan        for updating the loop bound of the first-loop to FIRST_NITERS.  If it
169689Skan        is false, the caller of this function may want to take care of this
169689Skan        (this can be useful if we don't want new stmts added to first-loop).
169689Skan
169689Skan   Output:
169689Skan   The function returns a pointer to the new loop-copy, or NULL if it failed
169689Skan   to perform the transformation.
169689Skan
169689Skan   The function generates two if-then-else guards: one before the first loop,
169689Skan   and the other before the second loop:
169689Skan   The first guard is:
169689Skan     if (FIRST_NITERS == 0) then skip the first loop,
169689Skan     and go directly to the second loop.
169689Skan   The second guard is:
169689Skan     if (FIRST_NITERS == NITERS) then skip the second loop.
169689Skan
169689Skan   FORNOW only simple loops are supported (see slpeel_can_duplicate_loop_p).
169689Skan   FORNOW the resulting code will not be in loop-closed-ssa form.
169689Skan*/
169689Skan
169689Skanstruct loop*
169689Skanslpeel_tree_peel_loop_to_edge (struct loop *loop, struct loops *loops,
169689Skan			       edge e, tree first_niters,
169689Skan			       tree niters, bool update_first_loop_count)
169689Skan{
169689Skan  struct loop *new_loop = NULL, *first_loop, *second_loop;
169689Skan  edge skip_e;
169689Skan  tree pre_condition;
169689Skan  bitmap definitions;
169689Skan  basic_block bb_before_second_loop, bb_after_second_loop;
169689Skan  basic_block bb_before_first_loop;
169689Skan  basic_block bb_between_loops;
169689Skan  basic_block new_exit_bb;
169689Skan  edge exit_e = loop->single_exit;
169689Skan  LOC loop_loc;
169689Skan
169689Skan  if (!slpeel_can_duplicate_loop_p (loop, e))
169689Skan    return NULL;
169689Skan
169689Skan  /* We have to initialize cfg_hooks. Then, when calling
169689Skan   cfg_hooks->split_edge, the function tree_split_edge
169689Skan   is actually called and, when calling cfg_hooks->duplicate_block,
169689Skan   the function tree_duplicate_bb is called.  */
169689Skan  tree_register_cfg_hooks ();
169689Skan
169689Skan
169689Skan  /* 1. Generate a copy of LOOP and put it on E (E is the entry/exit of LOOP).
169689Skan        Resulting CFG would be:
169689Skan
169689Skan        first_loop:
169689Skan        do {
169689Skan        } while ...
169689Skan
169689Skan        second_loop:
169689Skan        do {
169689Skan        } while ...
169689Skan
169689Skan        orig_exit_bb:
169689Skan   */
169689Skan
169689Skan  if (!(new_loop = slpeel_tree_duplicate_loop_to_edge_cfg (loop, loops, e)))
169689Skan    {
169689Skan      loop_loc = find_loop_location (loop);
169689Skan      if (dump_file && (dump_flags & TDF_DETAILS))
169689Skan        {
169689Skan          if (loop_loc != UNKNOWN_LOC)
169689Skan            fprintf (dump_file, "\n%s:%d: note: ",
169689Skan                     LOC_FILE (loop_loc), LOC_LINE (loop_loc));
169689Skan          fprintf (dump_file, "tree_duplicate_loop_to_edge_cfg failed.\n");
169689Skan        }
169689Skan      return NULL;
169689Skan    }
169689Skan
169689Skan  if (e == exit_e)
169689Skan    {
169689Skan      /* NEW_LOOP was placed after LOOP.  */
169689Skan      first_loop = loop;
169689Skan      second_loop = new_loop;
169689Skan    }
169689Skan  else
169689Skan    {
169689Skan      /* NEW_LOOP was placed before LOOP.  */
169689Skan      first_loop = new_loop;
169689Skan      second_loop = loop;
169689Skan    }
169689Skan
169689Skan  definitions = ssa_names_to_replace ();
169689Skan  slpeel_update_phis_for_duplicate_loop (loop, new_loop, e == exit_e);
169689Skan  rename_variables_in_loop (new_loop);
169689Skan
169689Skan
169689Skan  /* 2. Add the guard that controls whether the first loop is executed.
169689Skan        Resulting CFG would be:
169689Skan
169689Skan        bb_before_first_loop:
169689Skan        if (FIRST_NITERS == 0) GOTO bb_before_second_loop
169689Skan                               GOTO first-loop
169689Skan
169689Skan        first_loop:
169689Skan        do {
169689Skan        } while ...
169689Skan
169689Skan        bb_before_second_loop:
169689Skan
169689Skan        second_loop:
169689Skan        do {
169689Skan        } while ...
169689Skan
169689Skan        orig_exit_bb:
169689Skan   */
169689Skan
169689Skan  bb_before_first_loop = split_edge (loop_preheader_edge (first_loop));
169689Skan  add_bb_to_loop (bb_before_first_loop, first_loop->outer);
169689Skan  bb_before_second_loop = split_edge (first_loop->single_exit);
169689Skan  add_bb_to_loop (bb_before_second_loop, first_loop->outer);
169689Skan
169689Skan  pre_condition =
169689Skan    fold_build2 (LE_EXPR, boolean_type_node, first_niters,
169689Skan                 build_int_cst (TREE_TYPE (first_niters), 0));
169689Skan  skip_e = slpeel_add_loop_guard (bb_before_first_loop, pre_condition,
169689Skan                                  bb_before_second_loop, bb_before_first_loop);
169689Skan  slpeel_update_phi_nodes_for_guard1 (skip_e, first_loop,
169689Skan				      first_loop == new_loop,
169689Skan				      &new_exit_bb, &definitions);
169689Skan
169689Skan
169689Skan  /* 3. Add the guard that controls whether the second loop is executed.
169689Skan        Resulting CFG would be:
169689Skan
169689Skan        bb_before_first_loop:
169689Skan        if (FIRST_NITERS == 0) GOTO bb_before_second_loop (skip first loop)
169689Skan                               GOTO first-loop
169689Skan
169689Skan        first_loop:
169689Skan        do {
169689Skan        } while ...
169689Skan
169689Skan        bb_between_loops:
169689Skan        if (FIRST_NITERS == NITERS) GOTO bb_after_second_loop (skip second loop)
169689Skan                                    GOTO bb_before_second_loop
169689Skan
169689Skan        bb_before_second_loop:
169689Skan
169689Skan        second_loop:
169689Skan        do {
169689Skan        } while ...
169689Skan
169689Skan        bb_after_second_loop:
169689Skan
169689Skan        orig_exit_bb:
169689Skan   */
169689Skan
169689Skan  bb_between_loops = new_exit_bb;
169689Skan  bb_after_second_loop = split_edge (second_loop->single_exit);
169689Skan  add_bb_to_loop (bb_after_second_loop, second_loop->outer);
169689Skan
169689Skan  pre_condition =
169689Skan	fold_build2 (EQ_EXPR, boolean_type_node, first_niters, niters);
169689Skan  skip_e = slpeel_add_loop_guard (bb_between_loops, pre_condition,
169689Skan                                  bb_after_second_loop, bb_before_first_loop);
169689Skan  slpeel_update_phi_nodes_for_guard2 (skip_e, second_loop,
169689Skan                                     second_loop == new_loop, &new_exit_bb);
169689Skan
169689Skan  /* 4. Make first-loop iterate FIRST_NITERS times, if requested.
169689Skan   */
169689Skan  if (update_first_loop_count)
169689Skan    slpeel_make_loop_iterate_ntimes (first_loop, first_niters);
169689Skan
169689Skan  BITMAP_FREE (definitions);
169689Skan  delete_update_ssa ();
169689Skan
169689Skan  return new_loop;
169689Skan}
169689Skan
169689Skan/* Function vect_get_loop_location.
169689Skan
169689Skan   Extract the location of the loop in the source code.
169689Skan   If the loop is not well formed for vectorization, an estimated
169689Skan   location is calculated.
169689Skan   Return the loop location if succeed and NULL if not.  */
169689Skan
169689SkanLOC
169689Skanfind_loop_location (struct loop *loop)
169689Skan{
169689Skan  tree node = NULL_TREE;
169689Skan  basic_block bb;
169689Skan  block_stmt_iterator si;
169689Skan
169689Skan  if (!loop)
169689Skan    return UNKNOWN_LOC;
169689Skan
169689Skan  node = get_loop_exit_condition (loop);
169689Skan
169689Skan  if (node && EXPR_P (node) && EXPR_HAS_LOCATION (node)
169689Skan      && EXPR_FILENAME (node) && EXPR_LINENO (node))
169689Skan    return EXPR_LOC (node);
169689Skan
169689Skan  /* If we got here the loop is probably not "well formed",
169689Skan     try to estimate the loop location */
169689Skan
169689Skan  if (!loop->header)
169689Skan    return UNKNOWN_LOC;
169689Skan
169689Skan  bb = loop->header;
169689Skan
169689Skan  for (si = bsi_start (bb); !bsi_end_p (si); bsi_next (&si))
169689Skan    {
169689Skan      node = bsi_stmt (si);
169689Skan      if (node && EXPR_P (node) && EXPR_HAS_LOCATION (node))
169689Skan        return EXPR_LOC (node);
169689Skan    }
169689Skan
169689Skan  return UNKNOWN_LOC;
169689Skan}
169689Skan
169689Skan
169689Skan/*************************************************************************
169689Skan  Vectorization Debug Information.
169689Skan *************************************************************************/
169689Skan
169689Skan/* Function vect_set_verbosity_level.
169689Skan
169689Skan   Called from toplev.c upon detection of the
169689Skan   -ftree-vectorizer-verbose=N option.  */
169689Skan
169689Skanvoid
169689Skanvect_set_verbosity_level (const char *val)
169689Skan{
169689Skan   unsigned int vl;
169689Skan
169689Skan   vl = atoi (val);
169689Skan   if (vl < MAX_VERBOSITY_LEVEL)
169689Skan     vect_verbosity_level = vl;
169689Skan   else
169689Skan     vect_verbosity_level = MAX_VERBOSITY_LEVEL - 1;
169689Skan}
169689Skan
169689Skan
169689Skan/* Function vect_set_dump_settings.
169689Skan
169689Skan   Fix the verbosity level of the vectorizer if the
169689Skan   requested level was not set explicitly using the flag
169689Skan   -ftree-vectorizer-verbose=N.
169689Skan   Decide where to print the debugging information (dump_file/stderr).
169689Skan   If the user defined the verbosity level, but there is no dump file,
169689Skan   print to stderr, otherwise print to the dump file.  */
169689Skan
169689Skanstatic void
169689Skanvect_set_dump_settings (void)
169689Skan{
169689Skan  vect_dump = dump_file;
169689Skan
169689Skan  /* Check if the verbosity level was defined by the user:  */
169689Skan  if (vect_verbosity_level != MAX_VERBOSITY_LEVEL)
169689Skan    {
169689Skan      /* If there is no dump file, print to stderr.  */
169689Skan      if (!dump_file)
169689Skan        vect_dump = stderr;
169689Skan      return;
169689Skan    }
169689Skan
169689Skan  /* User didn't specify verbosity level:  */
169689Skan  if (dump_file && (dump_flags & TDF_DETAILS))
169689Skan    vect_verbosity_level = REPORT_DETAILS;
169689Skan  else if (dump_file && (dump_flags & TDF_STATS))
169689Skan    vect_verbosity_level = REPORT_UNVECTORIZED_LOOPS;
169689Skan  else
169689Skan    vect_verbosity_level = REPORT_NONE;
169689Skan
169689Skan  gcc_assert (dump_file || vect_verbosity_level == REPORT_NONE);
169689Skan}
169689Skan
169689Skan
169689Skan/* Function debug_loop_details.
169689Skan
169689Skan   For vectorization debug dumps.  */
169689Skan
169689Skanbool
169689Skanvect_print_dump_info (enum verbosity_levels vl)
169689Skan{
169689Skan  if (vl > vect_verbosity_level)
169689Skan    return false;
169689Skan
169689Skan  if (!current_function_decl || !vect_dump)
169689Skan    return false;
169689Skan
169689Skan  if (vect_loop_location == UNKNOWN_LOC)
169689Skan    fprintf (vect_dump, "\n%s:%d: note: ",
169689Skan		 DECL_SOURCE_FILE (current_function_decl),
169689Skan		 DECL_SOURCE_LINE (current_function_decl));
169689Skan  else
169689Skan    fprintf (vect_dump, "\n%s:%d: note: ",
169689Skan	     LOC_FILE (vect_loop_location), LOC_LINE (vect_loop_location));
169689Skan
169689Skan  return true;
169689Skan}
169689Skan
169689Skan
169689Skan/*************************************************************************
169689Skan  Vectorization Utilities.
169689Skan *************************************************************************/
169689Skan
169689Skan/* Function new_stmt_vec_info.
169689Skan
169689Skan   Create and initialize a new stmt_vec_info struct for STMT.  */
169689Skan
169689Skanstmt_vec_info
169689Skannew_stmt_vec_info (tree stmt, loop_vec_info loop_vinfo)
169689Skan{
169689Skan  stmt_vec_info res;
169689Skan  res = (stmt_vec_info) xcalloc (1, sizeof (struct _stmt_vec_info));
169689Skan
169689Skan  STMT_VINFO_TYPE (res) = undef_vec_info_type;
169689Skan  STMT_VINFO_STMT (res) = stmt;
169689Skan  STMT_VINFO_LOOP_VINFO (res) = loop_vinfo;
169689Skan  STMT_VINFO_RELEVANT_P (res) = 0;
169689Skan  STMT_VINFO_LIVE_P (res) = 0;
169689Skan  STMT_VINFO_VECTYPE (res) = NULL;
169689Skan  STMT_VINFO_VEC_STMT (res) = NULL;
169689Skan  STMT_VINFO_IN_PATTERN_P (res) = false;
169689Skan  STMT_VINFO_RELATED_STMT (res) = NULL;
169689Skan  STMT_VINFO_DATA_REF (res) = NULL;
169689Skan  if (TREE_CODE (stmt) == PHI_NODE)
169689Skan    STMT_VINFO_DEF_TYPE (res) = vect_unknown_def_type;
169689Skan  else
169689Skan    STMT_VINFO_DEF_TYPE (res) = vect_loop_def;
169689Skan  STMT_VINFO_SAME_ALIGN_REFS (res) = VEC_alloc (dr_p, heap, 5);
169689Skan
169689Skan  return res;
169689Skan}
169689Skan
169689Skan
169689Skan/* Function new_loop_vec_info.
169689Skan
169689Skan   Create and initialize a new loop_vec_info struct for LOOP, as well as
169689Skan   stmt_vec_info structs for all the stmts in LOOP.  */
169689Skan
169689Skanloop_vec_info
169689Skannew_loop_vec_info (struct loop *loop)
169689Skan{
169689Skan  loop_vec_info res;
169689Skan  basic_block *bbs;
169689Skan  block_stmt_iterator si;
169689Skan  unsigned int i;
169689Skan
169689Skan  res = (loop_vec_info) xcalloc (1, sizeof (struct _loop_vec_info));
169689Skan
169689Skan  bbs = get_loop_body (loop);
169689Skan
169689Skan  /* Create stmt_info for all stmts in the loop.  */
169689Skan  for (i = 0; i < loop->num_nodes; i++)
169689Skan    {
169689Skan      basic_block bb = bbs[i];
169689Skan      tree phi;
169689Skan
169689Skan      for (phi = phi_nodes (bb); phi; phi = PHI_CHAIN (phi))
169689Skan        {
169689Skan          stmt_ann_t ann = get_stmt_ann (phi);
169689Skan          set_stmt_info (ann, new_stmt_vec_info (phi, res));
169689Skan        }
169689Skan
169689Skan      for (si = bsi_start (bb); !bsi_end_p (si); bsi_next (&si))
169689Skan	{
169689Skan	  tree stmt = bsi_stmt (si);
169689Skan	  stmt_ann_t ann;
169689Skan
169689Skan	  ann = stmt_ann (stmt);
169689Skan	  set_stmt_info (ann, new_stmt_vec_info (stmt, res));
169689Skan	}
169689Skan    }
169689Skan
169689Skan  LOOP_VINFO_LOOP (res) = loop;
169689Skan  LOOP_VINFO_BBS (res) = bbs;
169689Skan  LOOP_VINFO_EXIT_COND (res) = NULL;
169689Skan  LOOP_VINFO_NITERS (res) = NULL;
169689Skan  LOOP_VINFO_VECTORIZABLE_P (res) = 0;
169689Skan  LOOP_PEELING_FOR_ALIGNMENT (res) = 0;
169689Skan  LOOP_VINFO_VECT_FACTOR (res) = 0;
169689Skan  LOOP_VINFO_DATAREFS (res) = VEC_alloc (data_reference_p, heap, 10);
169689Skan  LOOP_VINFO_DDRS (res) = VEC_alloc (ddr_p, heap, 10 * 10);
169689Skan  LOOP_VINFO_UNALIGNED_DR (res) = NULL;
169689Skan  LOOP_VINFO_MAY_MISALIGN_STMTS (res)
169689Skan    = VEC_alloc (tree, heap, PARAM_VALUE (PARAM_VECT_MAX_VERSION_CHECKS));
169689Skan
169689Skan  return res;
169689Skan}
169689Skan
169689Skan
169689Skan/* Function destroy_loop_vec_info.
169689Skan
169689Skan   Free LOOP_VINFO struct, as well as the stmt_vec_info structs of all the
169689Skan   phis and stmts in the basic blocks of the loop.  "Pattern stmts" that
169689Skan   the vectorizer introduced during the pattern recognition pass are
169689Skan   removed from their basic block along the way.  A NULL LOOP_VINFO is
169689Skan   silently ignored.  */
169689Skan
169689Skanvoid
169689Skandestroy_loop_vec_info (loop_vec_info loop_vinfo)
169689Skan{
169689Skan  struct loop *loop;
169689Skan  basic_block *bbs;
169689Skan  int nbbs;
169689Skan  block_stmt_iterator si;
169689Skan  int j;
169689Skan
169689Skan  if (!loop_vinfo)
169689Skan    return;
169689Skan
169689Skan  loop = LOOP_VINFO_LOOP (loop_vinfo);
169689Skan
169689Skan  bbs = LOOP_VINFO_BBS (loop_vinfo);
169689Skan  nbbs = loop->num_nodes;
169689Skan
169689Skan  for (j = 0; j < nbbs; j++)
169689Skan    {
169689Skan      basic_block bb = bbs[j];
169689Skan      tree phi;
169689Skan
169689Skan      /* Release the info attached to the phi nodes of BB.  */
169689Skan      for (phi = phi_nodes (bb); phi; phi = PHI_CHAIN (phi))
169689Skan        {
169689Skan          stmt_ann_t ann = stmt_ann (phi);
169689Skan
169689Skan          free (vinfo_for_stmt (phi));
169689Skan          set_stmt_info (ann, NULL);
169689Skan        }
169689Skan
169689Skan      /* Release the info attached to the stmts of BB.  The iterator is
169689Skan         advanced inside the loop body because removing a stmt already
169689Skan         moves it forward.  */
169689Skan      for (si = bsi_start (bb); !bsi_end_p (si); )
169689Skan        {
169689Skan          tree stmt = bsi_stmt (si);
169689Skan          stmt_ann_t ann = stmt_ann (stmt);
169689Skan          stmt_vec_info stmt_info = vinfo_for_stmt (stmt);
169689Skan          bool remove_stmt_p = false;
169689Skan
169689Skan          if (stmt_info)
169689Skan            {
169689Skan              /* Check if this is a "pattern stmt" (introduced by the
169689Skan                 vectorizer during the pattern recognition pass).  */
169689Skan              tree orig_stmt = STMT_VINFO_RELATED_STMT (stmt_info);
169689Skan              if (orig_stmt)
169689Skan                {
169689Skan                  stmt_vec_info orig_stmt_info = vinfo_for_stmt (orig_stmt);
169689Skan                  if (orig_stmt_info
169689Skan                      && STMT_VINFO_IN_PATTERN_P (orig_stmt_info))
169689Skan                    remove_stmt_p = true;
169689Skan                }
169689Skan
169689Skan              /* Free stmt_vec_info.  */
169689Skan              VEC_free (dr_p, heap, STMT_VINFO_SAME_ALIGN_REFS (stmt_info));
169689Skan              free (stmt_info);
169689Skan              set_stmt_info (ann, NULL);
169689Skan            }
169689Skan
169689Skan          /* Remove dead "pattern stmts".  bsi_remove leaves SI pointing at
169689Skan             the stmt that followed the removed one, so SI must only be
169689Skan             stepped explicitly when nothing was removed; stepping in both
169689Skan             cases would skip the stmt after every removed pattern stmt
169689Skan             and leave its stmt_vec_info unreleased.  */
169689Skan          if (remove_stmt_p)
169689Skan            bsi_remove (&si, true);
169689Skan          else
169689Skan            bsi_next (&si);
169689Skan        }
169689Skan    }
169689Skan
169689Skan  free (LOOP_VINFO_BBS (loop_vinfo));
169689Skan  free_data_refs (LOOP_VINFO_DATAREFS (loop_vinfo));
169689Skan  free_dependence_relations (LOOP_VINFO_DDRS (loop_vinfo));
169689Skan  VEC_free (tree, heap, LOOP_VINFO_MAY_MISALIGN_STMTS (loop_vinfo));
169689Skan
169689Skan  free (loop_vinfo);
169689Skan}
169689Skan
169689Skan
169689Skan/* Function vect_can_force_dr_alignment_p.
169689Skan
169689Skan   Returns true if DECL is a variable whose alignment may still be raised
169689Skan   to ALIGNMENT bits: it must be a VAR_DECL that is neither external nor
169689Skan   already written to the assembly output, and ALIGNMENT must not exceed
169689Skan   the limit that applies to its storage class.  */
169689Skan
169689Skanbool
169689Skanvect_can_force_dr_alignment_p (tree decl, unsigned int alignment)
169689Skan{
169689Skan  if (TREE_CODE (decl) != VAR_DECL
169689Skan      || DECL_EXTERNAL (decl)
169689Skan      || TREE_ASM_WRITTEN (decl))
169689Skan    return false;
169689Skan
169689Skan  /* Static objects are bounded by MAX_OFILE_ALIGNMENT.  For everything
169689Skan     else the bound used is PREFERRED_STACK_BOUNDARY, which is not 100%
169689Skan     correct: the absolute correct stack alignment is STACK_BOUNDARY, and
169689Skan     we are supposed to hope, but not assume, that
169689Skan     PREFERRED_STACK_BOUNDARY is honored by all translation units.
169689Skan     However, until someone implements forced stack alignment, SSE isn't
169689Skan     really usable without this.  */
169689Skan  return (TREE_STATIC (decl)
169689Skan          ? alignment <= MAX_OFILE_ALIGNMENT
169689Skan          : alignment <= PREFERRED_STACK_BOUNDARY);
169689Skan}
169689Skan
169689Skan
169689Skan/* Function get_vectype_for_scalar_type.
169689Skan
169689Skan   Builds the vector type whose elements are of SCALAR_TYPE and whose
169689Skan   total size is UNITS_PER_SIMD_WORD bytes.  Returns NULL_TREE when
169689Skan   SCALAR_TYPE has size zero or does not fit more than once in a SIMD
169689Skan   word, when no vector type could be built, or when the mode of the
169689Skan   resulting type is neither a vector mode nor an integral mode.  */
169689Skan
169689Skantree
169689Skanget_vectype_for_scalar_type (tree scalar_type)
169689Skan{
169689Skan  enum machine_mode scalar_mode = TYPE_MODE (scalar_type);
169689Skan  enum machine_mode vec_mode;
169689Skan  int scalar_size = GET_MODE_SIZE (scalar_mode);
169689Skan  int lanes;
169689Skan  tree vec_type;
169689Skan
169689Skan  if (scalar_size == 0 || scalar_size >= UNITS_PER_SIMD_WORD)
169689Skan    return NULL_TREE;
169689Skan
169689Skan  /* FORNOW: Only a single vector size per target (UNITS_PER_SIMD_WORD)
169689Skan     is expected.  */
169689Skan  lanes = UNITS_PER_SIMD_WORD / scalar_size;
169689Skan  vec_type = build_vector_type (scalar_type, lanes);
169689Skan
169689Skan  if (vect_print_dump_info (REPORT_DETAILS))
169689Skan    {
169689Skan      fprintf (vect_dump, "get vectype with %d units of type ", lanes);
169689Skan      print_generic_expr (vect_dump, scalar_type, TDF_SLIM);
169689Skan    }
169689Skan
169689Skan  if (vec_type == NULL_TREE)
169689Skan    return NULL_TREE;
169689Skan
169689Skan  if (vect_print_dump_info (REPORT_DETAILS))
169689Skan    {
169689Skan      fprintf (vect_dump, "vectype: ");
169689Skan      print_generic_expr (vect_dump, vec_type, TDF_SLIM);
169689Skan    }
169689Skan
169689Skan  /* Accept the type only if it was given a vector or an integral mode.  */
169689Skan  vec_mode = TYPE_MODE (vec_type);
169689Skan  if (VECTOR_MODE_P (vec_mode) || INTEGRAL_MODE_P (vec_mode))
169689Skan    return vec_type;
169689Skan
169689Skan  if (vect_print_dump_info (REPORT_DETAILS))
169689Skan    fprintf (vect_dump, "mode not supported by target.");
169689Skan  return NULL_TREE;
169689Skan}
169689Skan
169689Skan
169689Skan/* Function vect_supportable_dr_alignment
169689Skan
169689Skan   Classify how the access described by data reference DR can be
169689Skan   performed with respect to its alignment.  Aligned accesses yield
169689Skan   dr_aligned.  Otherwise only reads can be supported: through the
169689Skan   realign-load scheme (dr_unaligned_software_pipeline) or through a
169689Skan   misaligned move (dr_unaligned_supported).  Everything else is
169689Skan   dr_unaligned_unsupported.  */
169689Skan
169689Skanenum dr_alignment_support
169689Skanvect_supportable_dr_alignment (struct data_reference *dr)
169689Skan{
169689Skan  stmt_vec_info dr_stmt_info = vinfo_for_stmt (DR_STMT (dr));
169689Skan  tree vectype = STMT_VINFO_VECTYPE (dr_stmt_info);
169689Skan  enum machine_mode mode = (int) TYPE_MODE (vectype);
169689Skan
169689Skan  if (aligned_access_p (dr))
169689Skan    return dr_aligned;
169689Skan
169689Skan  /* Possibly unaligned access.  Nothing below applies to writes.  */
169689Skan  if (!DR_IS_READ (dr))
169689Skan    return dr_unaligned_unsupported;
169689Skan
169689Skan  /* The realign-load scheme needs the optab entry for MODE and, when the
169689Skan     target provides a builtin_mask_for_load hook, a non-null result
169689Skan     from it.  */
169689Skan  if (vec_realign_load_optab->handlers[mode].insn_code != CODE_FOR_nothing)
169689Skan    {
169689Skan      if (!targetm.vectorize.builtin_mask_for_load
169689Skan          || targetm.vectorize.builtin_mask_for_load ())
169689Skan        return dr_unaligned_software_pipeline;
169689Skan    }
169689Skan
169689Skan  /* Can't software pipeline the loads, but can at least do them.  */
169689Skan  if (movmisalign_optab->handlers[mode].insn_code != CODE_FOR_nothing)
169689Skan    return dr_unaligned_supported;
169689Skan
169689Skan  /* Unsupported.  */
169689Skan  return dr_unaligned_unsupported;
169689Skan}
169689Skan
169689Skan
169689Skan/* Function vect_is_simple_use.
169689Skan
169689Skan   Input:
169689Skan   LOOP - the loop that is being vectorized.
169689Skan   OPERAND - operand of a stmt in LOOP.
169689Skan   DEF - the defining stmt in case OPERAND is an SSA_NAME.
169689Skan
169689Skan   Returns whether a stmt with OPERAND can be vectorized.
169689Skan   Supportable operands are constants, loop invariants, and operands that are
169689Skan   defined by the current iteration of the loop. Unsupportable operands are
169689Skan   those that are defined by a previous iteration of the loop (as is the case
169689Skan   in reduction/induction computations).  */
169689Skan
169689Skanbool
169689Skanvect_is_simple_use (tree operand, loop_vec_info loop_vinfo, tree *def_stmt,
169689Skan		    tree *def, enum vect_def_type *dt)
169689Skan{
169689Skan  basic_block bb;
169689Skan  stmt_vec_info stmt_vinfo;
169689Skan  struct loop *loop = LOOP_VINFO_LOOP (loop_vinfo);
169689Skan
169689Skan  *def_stmt = NULL_TREE;
169689Skan  *def = NULL_TREE;
169689Skan
169689Skan  if (vect_print_dump_info (REPORT_DETAILS))
169689Skan    {
169689Skan      fprintf (vect_dump, "vect_is_simple_use: operand ");
169689Skan      print_generic_expr (vect_dump, operand, TDF_SLIM);
169689Skan    }
169689Skan
169689Skan  if (TREE_CODE (operand) == INTEGER_CST || TREE_CODE (operand) == REAL_CST)
169689Skan    {
169689Skan      *dt = vect_constant_def;
169689Skan      return true;
169689Skan    }
169689Skan
169689Skan  if (TREE_CODE (operand) != SSA_NAME)
169689Skan    {
169689Skan      if (vect_print_dump_info (REPORT_DETAILS))
169689Skan        fprintf (vect_dump, "not ssa-name.");
169689Skan      return false;
169689Skan    }
169689Skan
169689Skan  *def_stmt = SSA_NAME_DEF_STMT (operand);
169689Skan  if (*def_stmt == NULL_TREE )
169689Skan    {
169689Skan      if (vect_print_dump_info (REPORT_DETAILS))
169689Skan        fprintf (vect_dump, "no def_stmt.");
169689Skan      return false;
169689Skan    }
169689Skan
169689Skan  if (vect_print_dump_info (REPORT_DETAILS))
169689Skan    {
169689Skan      fprintf (vect_dump, "def_stmt: ");
169689Skan      print_generic_expr (vect_dump, *def_stmt, TDF_SLIM);
169689Skan    }
169689Skan
169689Skan  /* empty stmt is expected only in case of a function argument.
169689Skan     (Otherwise - we expect a phi_node or a modify_expr).  */
169689Skan  if (IS_EMPTY_STMT (*def_stmt))
169689Skan    {
169689Skan      tree arg = TREE_OPERAND (*def_stmt, 0);
169689Skan      if (TREE_CODE (arg) == INTEGER_CST || TREE_CODE (arg) == REAL_CST)
169689Skan        {
169689Skan          *def = operand;
169689Skan          *dt = vect_invariant_def;
169689Skan          return true;
169689Skan        }
169689Skan
169689Skan      if (vect_print_dump_info (REPORT_DETAILS))
169689Skan        fprintf (vect_dump, "Unexpected empty stmt.");
169689Skan      return false;
169689Skan    }
169689Skan
169689Skan  bb = bb_for_stmt (*def_stmt);
169689Skan  if (!flow_bb_inside_loop_p (loop, bb))
169689Skan    *dt = vect_invariant_def;
169689Skan  else
169689Skan    {
169689Skan      stmt_vinfo = vinfo_for_stmt (*def_stmt);
169689Skan      *dt = STMT_VINFO_DEF_TYPE (stmt_vinfo);
169689Skan    }
169689Skan
169689Skan  if (*dt == vect_unknown_def_type)
169689Skan    {
169689Skan      if (vect_print_dump_info (REPORT_DETAILS))
169689Skan        fprintf (vect_dump, "Unsupported pattern.");
169689Skan      return false;
169689Skan    }
169689Skan
169689Skan  /* stmts inside the loop that have been identified as performing
169689Skan     a reduction operation cannot have uses in the loop.  */
169689Skan  if (*dt == vect_reduction_def && TREE_CODE (*def_stmt) != PHI_NODE)
169689Skan    {
169689Skan      if (vect_print_dump_info (REPORT_DETAILS))
169689Skan        fprintf (vect_dump, "reduction used in loop.");
169689Skan      return false;
169689Skan    }
169689Skan
169689Skan  if (vect_print_dump_info (REPORT_DETAILS))
169689Skan    fprintf (vect_dump, "type of def: %d.",*dt);
169689Skan
169689Skan  switch (TREE_CODE (*def_stmt))
169689Skan    {
169689Skan    case PHI_NODE:
169689Skan      *def = PHI_RESULT (*def_stmt);
169689Skan      gcc_assert (*dt == vect_induction_def || *dt == vect_reduction_def
169689Skan                  || *dt == vect_invariant_def);
169689Skan      break;
169689Skan
169689Skan    case MODIFY_EXPR:
169689Skan      *def = TREE_OPERAND (*def_stmt, 0);
169689Skan      gcc_assert (*dt == vect_loop_def || *dt == vect_invariant_def);
169689Skan      break;
169689Skan
169689Skan    default:
169689Skan      if (vect_print_dump_info (REPORT_DETAILS))
169689Skan        fprintf (vect_dump, "unsupported defining stmt: ");
169689Skan      return false;
169689Skan    }
169689Skan
169689Skan  if (*dt == vect_induction_def)
169689Skan    {
169689Skan      if (vect_print_dump_info (REPORT_DETAILS))
169689Skan        fprintf (vect_dump, "induction not supported.");
169689Skan      return false;
169689Skan    }
169689Skan
169689Skan  return true;
169689Skan}
169689Skan
169689Skan
169689Skan/* Function reduction_code_for_scalar_code
169689Skan
169689Skan   Input:
169689Skan   CODE - tree_code of a reduction operation.
169689Skan
169689Skan   Output:
169689Skan   REDUC_CODE - the corresponding tree-code to be used to reduce the
169689Skan      vector of partial results into a single scalar result (which
169689Skan      will also reside in a vector).  Left untouched when there is no
169689Skan      corresponding code.
169689Skan
169689Skan   Return TRUE if a corresponding REDUC_CODE was found (CODE is one of
169689Skan   MAX_EXPR, MIN_EXPR or PLUS_EXPR), FALSE otherwise.  */
169689Skan
169689Skanbool
169689Skanreduction_code_for_scalar_code (enum tree_code code,
169689Skan                                enum tree_code *reduc_code)
169689Skan{
169689Skan  switch (code)
169689Skan    {
169689Skan    case MAX_EXPR:
169689Skan      *reduc_code = REDUC_MAX_EXPR;
169689Skan      break;
169689Skan
169689Skan    case MIN_EXPR:
169689Skan      *reduc_code = REDUC_MIN_EXPR;
169689Skan      break;
169689Skan
169689Skan    case PLUS_EXPR:
169689Skan      *reduc_code = REDUC_PLUS_EXPR;
169689Skan      break;
169689Skan
169689Skan    default:
169689Skan      /* No vector reduction code for this operation.  */
169689Skan      return false;
169689Skan    }
169689Skan
169689Skan  return true;
169689Skan}
169689Skan
169689Skan
169689Skan/* Function vect_is_simple_reduction
169689Skan
169689Skan   Detect a cross-iteration def-use cycle that represents a simple
169689Skan   reduction computation. We look for the following pattern:
169689Skan
169689Skan   loop_header:
169689Skan     a1 = phi < a0, a2 >
169689Skan     a3 = ...
169689Skan     a2 = operation (a3, a1)
169689Skan
169689Skan   such that:
169689Skan   1. operation is commutative and associative and it is safe to
169689Skan      change the order of the computation.
169689Skan   2. no uses for a2 in the loop (a2 is used out of the loop)
169689Skan   3. no uses of a1 in the loop besides the reduction operation.
169689Skan
169689Skan   Condition 1 is tested here.
169689Skan   Conditions 2,3 are tested in vect_mark_stmts_to_be_vectorized.
169689Skan
169689Skan   LOOP is the loop being analyzed and PHI the candidate phi (a1 above).
169689Skan
169689Skan   Returns the stmt that defines the latch argument of PHI (the stmt
169689Skan   defining a2 above) when the pattern is recognized, and NULL_TREE
169689Skan   otherwise.  When PHI is found to define the first operand of the
169689Skan   operation, the two operands are swapped in place before returning, so
169689Skan   that the reduction variable ends up as the second operand.  */
169689Skan
169689Skantree
169689Skanvect_is_simple_reduction (struct loop *loop, tree phi)
169689Skan{
169689Skan  edge latch_e = loop_latch_edge (loop);
169689Skan  tree loop_arg = PHI_ARG_DEF_FROM_EDGE (phi, latch_e); /* a2 above.  */
169689Skan  tree def_stmt, def1, def2;
169689Skan  enum tree_code code;
169689Skan  int op_type;
169689Skan  tree operation, op1, op2;
169689Skan  tree type;
169689Skan
169689Skan  if (TREE_CODE (loop_arg) != SSA_NAME)
169689Skan    {
169689Skan      if (vect_print_dump_info (REPORT_DETAILS))
169689Skan        {
169689Skan          fprintf (vect_dump, "reduction: not ssa_name: ");
169689Skan          print_generic_expr (vect_dump, loop_arg, TDF_SLIM);
169689Skan        }
169689Skan      return NULL_TREE;
169689Skan    }
169689Skan
169689Skan  def_stmt = SSA_NAME_DEF_STMT (loop_arg);
169689Skan  if (!def_stmt)
169689Skan    {
169689Skan      if (vect_print_dump_info (REPORT_DETAILS))
169689Skan        fprintf (vect_dump, "reduction: no def_stmt.");
169689Skan      return NULL_TREE;
169689Skan    }
169689Skan
169689Skan  if (TREE_CODE (def_stmt) != MODIFY_EXPR) /* Not "a2 = operation (...)".  */
169689Skan    {
169689Skan      if (vect_print_dump_info (REPORT_DETAILS))
169689Skan        {
169689Skan          print_generic_expr (vect_dump, def_stmt, TDF_SLIM); /* Dumped without a label.  */
169689Skan        }
169689Skan      return NULL_TREE;
169689Skan    }
169689Skan
169689Skan  operation = TREE_OPERAND (def_stmt, 1); /* Right-hand side of DEF_STMT.  */
169689Skan  code = TREE_CODE (operation);
169689Skan  if (!commutative_tree_code (code) || !associative_tree_code (code))
169689Skan    {
169689Skan      if (vect_print_dump_info (REPORT_DETAILS))
169689Skan        {
169689Skan          fprintf (vect_dump, "reduction: not commutative/associative: ");
169689Skan          print_generic_expr (vect_dump, operation, TDF_SLIM);
169689Skan        }
169689Skan      return NULL_TREE;
169689Skan    }
169689Skan
169689Skan  op_type = TREE_CODE_LENGTH (code); /* Number of operands of CODE.  */
169689Skan  if (op_type != binary_op)
169689Skan    {
169689Skan      if (vect_print_dump_info (REPORT_DETAILS))
169689Skan        {
169689Skan          fprintf (vect_dump, "reduction: not binary operation: ");
169689Skan          print_generic_expr (vect_dump, operation, TDF_SLIM);
169689Skan        }
169689Skan      return NULL_TREE;
169689Skan    }
169689Skan
169689Skan  op1 = TREE_OPERAND (operation, 0);
169689Skan  op2 = TREE_OPERAND (operation, 1);
169689Skan  if (TREE_CODE (op1) != SSA_NAME || TREE_CODE (op2) != SSA_NAME)
169689Skan    {
169689Skan      if (vect_print_dump_info (REPORT_DETAILS))
169689Skan        {
169689Skan          fprintf (vect_dump, "reduction: uses not ssa_names: ");
169689Skan          print_generic_expr (vect_dump, operation, TDF_SLIM);
169689Skan        }
169689Skan      return NULL_TREE;
169689Skan    }
169689Skan
169689Skan  /* Check that it's ok to change the order of the computation.  Both
169689Skan     operands must have the same main variant type as the operation
169689Skan     itself.  */
169689Skan  type = TREE_TYPE (operation);
169689Skan  if (TYPE_MAIN_VARIANT (type) != TYPE_MAIN_VARIANT (TREE_TYPE (op1))
169689Skan      || TYPE_MAIN_VARIANT (type) != TYPE_MAIN_VARIANT (TREE_TYPE (op2)))
169689Skan    {
169689Skan      if (vect_print_dump_info (REPORT_DETAILS))
169689Skan        {
169689Skan          fprintf (vect_dump, "reduction: multiple types: operation type: ");
169689Skan          print_generic_expr (vect_dump, type, TDF_SLIM);
169689Skan          fprintf (vect_dump, ", operands types: ");
169689Skan          print_generic_expr (vect_dump, TREE_TYPE (op1), TDF_SLIM);
169689Skan          fprintf (vect_dump, ",");
169689Skan          print_generic_expr (vect_dump, TREE_TYPE (op2), TDF_SLIM);
169689Skan        }
169689Skan      return NULL_TREE;
169689Skan    }
169689Skan
169689Skan  /* CHECKME: check for !flag_finite_math_only too?  */
169689Skan  if (SCALAR_FLOAT_TYPE_P (type) && !flag_unsafe_math_optimizations)
169689Skan    {
169689Skan      /* Changing the order of operations changes the semantics.  */
169689Skan      if (vect_print_dump_info (REPORT_DETAILS))
169689Skan        {
169689Skan          fprintf (vect_dump, "reduction: unsafe fp math optimization: ");
169689Skan          print_generic_expr (vect_dump, operation, TDF_SLIM);
169689Skan        }
169689Skan      return NULL_TREE;
169689Skan    }
169689Skan  else if (INTEGRAL_TYPE_P (type) && TYPE_OVERFLOW_TRAPS (type))
169689Skan    {
169689Skan      /* Changing the order of operations changes the semantics.  */
169689Skan      if (vect_print_dump_info (REPORT_DETAILS))
169689Skan        {
169689Skan          fprintf (vect_dump, "reduction: unsafe int math optimization: ");
169689Skan          print_generic_expr (vect_dump, operation, TDF_SLIM);
169689Skan        }
169689Skan      return NULL_TREE;
169689Skan    }
169689Skan
169689Skan  /* reduction is safe. we're dealing with one of the following:
169689Skan     1) integer arithmetic and no trapv
169689Skan     2) floating point arithmetic, and special flags permit this optimization.
169689Skan   */
169689Skan  def1 = SSA_NAME_DEF_STMT (op1);
169689Skan  def2 = SSA_NAME_DEF_STMT (op2);
169689Skan  if (!def1 || !def2)
169689Skan    {
169689Skan      if (vect_print_dump_info (REPORT_DETAILS))
169689Skan        {
169689Skan          fprintf (vect_dump, "reduction: no defs for operands: ");
169689Skan          print_generic_expr (vect_dump, operation, TDF_SLIM);
169689Skan        }
169689Skan      return NULL_TREE;
169689Skan    }
169689Skan
169689Skan  if (TREE_CODE (def1) == MODIFY_EXPR
169689Skan      && flow_bb_inside_loop_p (loop, bb_for_stmt (def1))
169689Skan      && def2 == phi) /* PHI already feeds the second operand.  */
169689Skan    {
169689Skan      if (vect_print_dump_info (REPORT_DETAILS))
169689Skan        {
169689Skan          fprintf (vect_dump, "detected reduction:");
169689Skan          print_generic_expr (vect_dump, operation, TDF_SLIM);
169689Skan        }
169689Skan      return def_stmt;
169689Skan    }
169689Skan  else if (TREE_CODE (def2) == MODIFY_EXPR
169689Skan      && flow_bb_inside_loop_p (loop, bb_for_stmt (def2))
169689Skan      && def1 == phi) /* PHI feeds the first operand.  */
169689Skan    {
169689Skan      /* Swap operands (just for simplicity - so that the rest of the code
169689Skan	 can assume that the reduction variable is always the last (second)
169689Skan	 argument).  */
169689Skan      if (vect_print_dump_info (REPORT_DETAILS))
169689Skan        {
169689Skan          fprintf (vect_dump, "detected reduction: need to swap operands:");
169689Skan          print_generic_expr (vect_dump, operation, TDF_SLIM);
169689Skan        }
169689Skan      swap_tree_operands (def_stmt, &TREE_OPERAND (operation, 0),
169689Skan				    &TREE_OPERAND (operation, 1));
169689Skan      return def_stmt;
169689Skan    }
169689Skan  else
169689Skan    {
169689Skan      if (vect_print_dump_info (REPORT_DETAILS))
169689Skan        {
169689Skan          fprintf (vect_dump, "reduction: unknown pattern.");
169689Skan          print_generic_expr (vect_dump, operation, TDF_SLIM);
169689Skan        }
169689Skan      return NULL_TREE;
169689Skan    }
169689Skan}
169689Skan
169689Skan
169689Skan/* Function vect_is_simple_iv_evolution.
169689Skan
169689Skan   FORNOW: A simple evolution of an induction variable in the loop is
169689Skan   considered a polynomial evolution with constant step.
169689Skan
169689Skan   ACCESS_FN is examined with respect to loop number LOOP_NB.  Returns
169689Skan   false, leaving INIT and STEP untouched, when ACCESS_FN has no
169689Skan   evolution in that loop or when its evolution part is itself a chrec.
169689Skan   Otherwise the initial condition and the step are stored in *INIT and
169689Skan   *STEP, and the result tells whether the step is an INTEGER_CST.  */
169689Skan
169689Skanbool
169689Skanvect_is_simple_iv_evolution (unsigned loop_nb, tree access_fn, tree * init,
169689Skan                             tree * step)
169689Skan{
169689Skan  tree start;
169689Skan  tree stride = evolution_part_in_loop_num (access_fn, loop_nb);
169689Skan
169689Skan  /* When there is no evolution in this loop, the evolution function
169689Skan     is not "simple"; neither is it when the evolution is a polynomial
169689Skan     of degree >= 2.  */
169689Skan  if (stride == NULL_TREE || tree_is_chrec (stride))
169689Skan    return false;
169689Skan
169689Skan  start = unshare_expr (initial_condition_in_loop_num (access_fn, loop_nb));
169689Skan
169689Skan  if (vect_print_dump_info (REPORT_DETAILS))
169689Skan    {
169689Skan      fprintf (vect_dump, "step: ");
169689Skan      print_generic_expr (vect_dump, stride, TDF_SLIM);
169689Skan      fprintf (vect_dump, ",  init: ");
169689Skan      print_generic_expr (vect_dump, start, TDF_SLIM);
169689Skan    }
169689Skan
169689Skan  /* The outputs are handed back even if the step check below fails.  */
169689Skan  *init = start;
169689Skan  *step = stride;
169689Skan
169689Skan  if (TREE_CODE (stride) == INTEGER_CST)
169689Skan    return true;
169689Skan
169689Skan  if (vect_print_dump_info (REPORT_DETAILS))
169689Skan    fprintf (vect_dump, "step unknown.");
169689Skan  return false;
169689Skan}
169689Skan
169689Skan
169689Skan/* Function vectorize_loops.
169689Skan
169689Skan   Entry Point to loop vectorization phase.  Every loop recorded in LOOPS
169689Skan   on entry is analyzed and, if found vectorizable, transformed; the
169689Skan   per-loop vectorization info is released once all loops have been
169689Skan   handled.  */
169689Skan
169689Skanvoid
169689Skanvectorize_loops (struct loops *loops)
169689Skan{
169689Skan  unsigned int vectorized_count = 0;
169689Skan  unsigned int loop_idx;
169689Skan
169689Skan  /* Fix the verbosity level if not defined explicitly by the user.  */
169689Skan  vect_set_dump_settings ();
169689Skan
169689Skan  /* Allocate the bitmap that records which virtual variables need to
169689Skan     be renamed.  */
169689Skan  vect_vnames_to_rename = BITMAP_ALLOC (NULL);
169689Skan
169689Skan  /*  ----------- Analyze loops. -----------  */
169689Skan
169689Skan  /* If some loop was duplicated, it gets bigger number
169689Skan     than all previously defined loops. This fact allows us to run
169689Skan     only over initial loops skipping newly generated ones.  */
169689Skan  vect_loops_num = loops->num;
169689Skan  for (loop_idx = 1; loop_idx < vect_loops_num; loop_idx++)
169689Skan    {
169689Skan      struct loop *loop = loops->parray[loop_idx];
169689Skan      loop_vec_info loop_vinfo;
169689Skan
169689Skan      if (loop == NULL)
169689Skan        continue;
169689Skan
169689Skan      vect_loop_location = find_loop_location (loop);
169689Skan      loop_vinfo = vect_analyze_loop (loop);
169689Skan      loop->aux = loop_vinfo;
169689Skan
169689Skan      if (loop_vinfo && LOOP_VINFO_VECTORIZABLE_P (loop_vinfo))
169689Skan        {
169689Skan          vect_transform_loop (loop_vinfo, loops);
169689Skan          vectorized_count++;
169689Skan        }
169689Skan    }
169689Skan  vect_loop_location = UNKNOWN_LOC;
169689Skan
169689Skan  if (vect_print_dump_info (REPORT_VECTORIZED_LOOPS))
169689Skan    fprintf (vect_dump, "vectorized %u loops in function.\n",
169689Skan             vectorized_count);
169689Skan
169689Skan  /*  ----------- Finalize. -----------  */
169689Skan
169689Skan  BITMAP_FREE (vect_vnames_to_rename);
169689Skan
169689Skan  /* Release the info that the analysis phase hung on each loop.  */
169689Skan  for (loop_idx = 1; loop_idx < vect_loops_num; loop_idx++)
169689Skan    {
169689Skan      struct loop *loop = loops->parray[loop_idx];
169689Skan
169689Skan      if (loop != NULL)
169689Skan        {
169689Skan          loop_vec_info loop_vinfo = loop->aux;
169689Skan
169689Skan          destroy_loop_vec_info (loop_vinfo);
169689Skan          loop->aux = NULL;
169689Skan        }
169689Skan    }
169689Skan}