LCOV - code coverage report
Current view: top level - gcc - tree-vectorizer.h (source / functions) Coverage Total Hit
Test: gcc.info Lines: 96.7 % 214 207
Test Date: 2024-12-21 13:15:12 Functions: 93.3 % 30 28
Legend: Lines: hit not hit | Branches: + taken - not taken # not executed Branches: - 0 0

             Branch data     Line data    Source code
       1                 :             : /* Vectorizer
       2                 :             :    Copyright (C) 2003-2024 Free Software Foundation, Inc.
       3                 :             :    Contributed by Dorit Naishlos <dorit@il.ibm.com>
       4                 :             : 
       5                 :             : This file is part of GCC.
       6                 :             : 
       7                 :             : GCC is free software; you can redistribute it and/or modify it under
       8                 :             : the terms of the GNU General Public License as published by the Free
       9                 :             : Software Foundation; either version 3, or (at your option) any later
      10                 :             : version.
      11                 :             : 
      12                 :             : GCC is distributed in the hope that it will be useful, but WITHOUT ANY
      13                 :             : WARRANTY; without even the implied warranty of MERCHANTABILITY or
      14                 :             : FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
      15                 :             : for more details.
      16                 :             : 
      17                 :             : You should have received a copy of the GNU General Public License
      18                 :             : along with GCC; see the file COPYING3.  If not see
      19                 :             : <http://www.gnu.org/licenses/>.  */
      20                 :             : 
      21                 :             : #ifndef GCC_TREE_VECTORIZER_H
      22                 :             : #define GCC_TREE_VECTORIZER_H
      23                 :             : 
      24                 :             : typedef class _stmt_vec_info *stmt_vec_info;
      25                 :             : typedef struct _slp_tree *slp_tree;
      26                 :             : 
      27                 :             : #include "tree-data-ref.h"
      28                 :             : #include "tree-hash-traits.h"
      29                 :             : #include "target.h"
      30                 :             : #include "internal-fn.h"
      31                 :             : #include "tree-ssa-operands.h"
      32                 :             : #include "gimple-match.h"
      33                 :             : 
      34                 :             : /* Used for naming of new temporaries.  */
      35                 :             : enum vect_var_kind {
      36                 :             :   vect_simple_var,
      37                 :             :   vect_pointer_var,
      38                 :             :   vect_scalar_var,
      39                 :             :   vect_mask_var
      40                 :             : };
      41                 :             : 
      42                 :             : /* Defines type of operation.  */
      43                 :             : enum operation_type {
      44                 :             :   unary_op = 1,
      45                 :             :   binary_op,
      46                 :             :   ternary_op
      47                 :             : };
      48                 :             : 
      49                 :             : /* Define type of available alignment support.  */
      50                 :             : enum dr_alignment_support {
      51                 :             :   dr_unaligned_unsupported,
      52                 :             :   dr_unaligned_supported,
      53                 :             :   dr_explicit_realign,
      54                 :             :   dr_explicit_realign_optimized,
      55                 :             :   dr_aligned
      56                 :             : };
      57                 :             : 
      58                 :             : /* Define type of def-use cross-iteration cycle.  */
      59                 :             : enum vect_def_type {
      60                 :             :   vect_uninitialized_def = 0,
      61                 :             :   vect_constant_def = 1,
      62                 :             :   vect_external_def,
      63                 :             :   vect_internal_def,
      64                 :             :   vect_induction_def,
      65                 :             :   vect_reduction_def,
      66                 :             :   vect_double_reduction_def,
      67                 :             :   vect_nested_cycle,
      68                 :             :   vect_first_order_recurrence,
      69                 :             :   vect_condition_def,
      70                 :             :   vect_unknown_def_type
      71                 :             : };
      72                 :             : 
      73                 :             : /* Define operation type of linear/non-linear induction variable.  */
      74                 :             : enum vect_induction_op_type {
      75                 :             :    vect_step_op_add = 0,
      76                 :             :    vect_step_op_neg,
      77                 :             :    vect_step_op_mul,
      78                 :             :    vect_step_op_shl,
      79                 :             :    vect_step_op_shr
      80                 :             : };
      81                 :             : 
      82                 :             : /* Define type of reduction.  */
      83                 :             : enum vect_reduction_type {
      84                 :             :   TREE_CODE_REDUCTION,
      85                 :             :   COND_REDUCTION,
      86                 :             :   INTEGER_INDUC_COND_REDUCTION,
      87                 :             :   CONST_COND_REDUCTION,
      88                 :             : 
      89                 :             :   /* Retain a scalar phi and use a FOLD_EXTRACT_LAST within the loop
      90                 :             :      to implement:
      91                 :             : 
      92                 :             :        for (int i = 0; i < VF; ++i)
      93                 :             :          res = cond[i] ? val[i] : res;  */
      94                 :             :   EXTRACT_LAST_REDUCTION,
      95                 :             : 
      96                 :             :   /* Use a folding reduction within the loop to implement:
      97                 :             : 
      98                 :             :        for (int i = 0; i < VF; ++i)
      99                 :             :          res = res OP val[i];
     100                 :             : 
     101                 :             :      (with no reassociation).  */
     102                 :             :   FOLD_LEFT_REDUCTION
     103                 :             : };
     104                 :             : 
     105                 :             : #define VECTORIZABLE_CYCLE_DEF(D) (((D) == vect_reduction_def)           \
     106                 :             :                                    || ((D) == vect_double_reduction_def) \
     107                 :             :                                    || ((D) == vect_nested_cycle))
     108                 :             : 
     109                 :             : /* Structure to encapsulate information about a group of like
     110                 :             :    instructions to be presented to the target cost model.  */
     111                 :             : struct stmt_info_for_cost {
     112                 :             :   int count;
     113                 :             :   enum vect_cost_for_stmt kind;
     114                 :             :   enum vect_cost_model_location where;
     115                 :             :   stmt_vec_info stmt_info;
     116                 :             :   slp_tree node;
     117                 :             :   tree vectype;
     118                 :             :   int misalign;
     119                 :             : };
     120                 :             : 
     121                 :             : typedef vec<stmt_info_for_cost> stmt_vector_for_cost;
     122                 :             : 
     123                 :             : /* Maps base addresses to an innermost_loop_behavior and the stmt it was
     124                 :             :    derived from that gives the maximum known alignment for that base.  */
     125                 :             : typedef hash_map<tree_operand_hash,
     126                 :             :                  std::pair<stmt_vec_info, innermost_loop_behavior *> >
     127                 :             :           vec_base_alignments;
     128                 :             : 
     129                 :             : /* Represents elements [START, START + LENGTH) of cyclical array OPS*
     130                 :             :    (i.e. OPS repeated to give at least START + LENGTH elements)  */
     131                 :             : struct vect_scalar_ops_slice
     132                 :             : {
     133                 :             :   tree op (unsigned int i) const;
     134                 :             :   bool all_same_p () const;
     135                 :             : 
     136                 :             :   vec<tree> *ops;
     137                 :             :   unsigned int start;
     138                 :             :   unsigned int length;
     139                 :             : };
     140                 :             : 
     141                 :             : /* Return element I of the slice.  */
     142                 :             : inline tree
     143                 :     2981136 : vect_scalar_ops_slice::op (unsigned int i) const
     144                 :             : {
     145                 :     5962272 :   return (*ops)[(i + start) % ops->length ()];
     146                 :             : }
     147                 :             : 
     148                 :             : /* Hash traits for vect_scalar_ops_slice.  */
     149                 :             : struct vect_scalar_ops_slice_hash : typed_noop_remove<vect_scalar_ops_slice>
     150                 :             : {
     151                 :             :   typedef vect_scalar_ops_slice value_type;
     152                 :             :   typedef vect_scalar_ops_slice compare_type;
     153                 :             : 
     154                 :             :   static const bool empty_zero_p = true;
     155                 :             : 
     156                 :             :   static void mark_deleted (value_type &s) { s.length = ~0U; }
     157                 :           0 :   static void mark_empty (value_type &s) { s.length = 0; }
     158                 :      666616 :   static bool is_deleted (const value_type &s) { return s.length == ~0U; }
     159                 :     6407009 :   static bool is_empty (const value_type &s) { return s.length == 0; }
     160                 :             :   static hashval_t hash (const value_type &);
     161                 :             :   static bool equal (const value_type &, const compare_type &);
     162                 :             : };
     163                 :             : 
     164                 :             : /* Describes how we're going to vectorize an individual load or store,
     165                 :             :    or a group of loads or stores.  */
     166                 :             : enum vect_memory_access_type {
     167                 :             :   /* An access to an invariant address.  This is used only for loads.  */
     168                 :             :   VMAT_INVARIANT,
     169                 :             : 
     170                 :             :   /* A simple contiguous access.  */
     171                 :             :   VMAT_CONTIGUOUS,
     172                 :             : 
     173                 :             :   /* A contiguous access that goes down in memory rather than up,
     174                 :             :      with no additional permutation.  This is used only for stores
     175                 :             :      of invariants.  */
     176                 :             :   VMAT_CONTIGUOUS_DOWN,
     177                 :             : 
     178                 :             :   /* A simple contiguous access in which the elements need to be permuted
     179                 :             :      after loading or before storing.  Only used for loop vectorization;
     180                 :             :      SLP uses separate permutes.  */
     181                 :             :   VMAT_CONTIGUOUS_PERMUTE,
     182                 :             : 
     183                 :             :   /* A simple contiguous access in which the elements need to be reversed
     184                 :             :      after loading or before storing.  */
     185                 :             :   VMAT_CONTIGUOUS_REVERSE,
     186                 :             : 
     187                 :             :   /* An access that uses IFN_LOAD_LANES or IFN_STORE_LANES.  */
     188                 :             :   VMAT_LOAD_STORE_LANES,
     189                 :             : 
     190                 :             :   /* An access in which each scalar element is loaded or stored
     191                 :             :      individually.  */
     192                 :             :   VMAT_ELEMENTWISE,
     193                 :             : 
     194                 :             :   /* A hybrid of VMAT_CONTIGUOUS and VMAT_ELEMENTWISE, used for grouped
     195                 :             :      SLP accesses.  Each unrolled iteration uses a contiguous load
     196                 :             :      or store for the whole group, but the groups from separate iterations
     197                 :             :      are combined in the same way as for VMAT_ELEMENTWISE.  */
     198                 :             :   VMAT_STRIDED_SLP,
     199                 :             : 
     200                 :             :   /* The access uses gather loads or scatter stores.  */
     201                 :             :   VMAT_GATHER_SCATTER
     202                 :             : };
     203                 :             : 
     204                 :             : /************************************************************************
     205                 :             :   SLP
     206                 :             :  ************************************************************************/
     207                 :             : typedef vec<std::pair<unsigned, unsigned> > lane_permutation_t;
     208                 :             : typedef auto_vec<std::pair<unsigned, unsigned>, 16> auto_lane_permutation_t;
     209                 :             : typedef vec<unsigned> load_permutation_t;
     210                 :             : typedef auto_vec<unsigned, 16> auto_load_permutation_t;
     211                 :             : 
     212                 :             : /* A computation tree of an SLP instance.  Each node corresponds to a group of
     213                 :             :    stmts to be packed in a SIMD stmt.  */
     214                 :             : struct _slp_tree {
     215                 :             :   _slp_tree ();
     216                 :             :   ~_slp_tree ();
     217                 :             : 
     218                 :             :   void push_vec_def (gimple *def);
     219                 :        7247 :   void push_vec_def (tree def) { vec_defs.quick_push (def); }
     220                 :             : 
     221                 :             :   /* Nodes that contain def-stmts of this node's statements' operands.  */
     222                 :             :   vec<slp_tree> children;
     223                 :             : 
     224                 :             :   /* A group of scalar stmts to be vectorized together.  */
     225                 :             :   vec<stmt_vec_info> stmts;
     226                 :             :   /* A group of scalar operands to be vectorized together.  */
     227                 :             :   vec<tree> ops;
     228                 :             :   /* The representative that should be used for analysis and
     229                 :             :      code generation.  */
     230                 :             :   stmt_vec_info representative;
     231                 :             : 
     232                 :             :   /* Load permutation relative to the stores, NULL if there is no
     233                 :             :      permutation.  */
     234                 :             :   load_permutation_t load_permutation;
     235                 :             :   /* Lane permutation of the operands scalar lanes encoded as pairs
     236                 :             :      of { operand number, lane number }.  The number of elements
     237                 :             :      denotes the number of output lanes.  */
     238                 :             :   lane_permutation_t lane_permutation;
     239                 :             : 
     240                 :             :   /* Selected SIMD clone's function info.  First vector element
     241                 :             :      is SIMD clone's function decl, followed by a pair of trees (base + step)
     242                 :             :      for linear arguments (pair of NULLs for other arguments).  */
     243                 :             :   vec<tree> simd_clone_info;
     244                 :             : 
     245                 :             :   tree vectype;
     246                 :             :   /* Vectorized defs.  */
     247                 :             :   vec<tree> vec_defs;
     248                 :             :   /* Number of vector stmts that are created to replace the group of scalar
     249                 :             :      stmts. It is calculated during the transformation phase as the number of
     250                 :             :      scalar elements in one scalar iteration (GROUP_SIZE) multiplied by VF
     251                 :             :      divided by vector size.  */
     252                 :             :   unsigned int vec_stmts_size;
     253                 :             : 
     254                 :             :   /* Reference count in the SLP graph.  */
     255                 :             :   unsigned int refcnt;
     256                 :             :   /* The maximum number of vector elements for the subtree rooted
     257                 :             :      at this node.  */
     258                 :             :   poly_uint64 max_nunits;
     259                 :             :   /* The DEF type of this node.  */
     260                 :             :   enum vect_def_type def_type;
     261                 :             :   /* The number of scalar lanes produced by this node.  */
     262                 :             :   unsigned int lanes;
     263                 :             :   /* The operation of this node.  */
     264                 :             :   enum tree_code code;
     265                 :             :   /* Whether uses of this load or feeders of this store are suitable
     266                 :             :      for load/store-lanes.  */
     267                 :             :   bool ldst_lanes;
     268                 :             : 
     269                 :             :   int vertex;
     270                 :             : 
     271                 :             :   /* Classifies how the load or store is going to be implemented
     272                 :             :      for loop vectorization.  */
     273                 :             :   vect_memory_access_type memory_access_type;
     274                 :             : 
     275                 :             :   /* If not NULL this is a cached failed SLP discovery attempt with
     276                 :             :      the lanes that failed during SLP discovery as 'false'.  This is
     277                 :             :      a copy of the matches array.  */
     278                 :             :   bool *failed;
     279                 :             : 
     280                 :             :   /* Allocate from slp_tree_pool.  */
     281                 :             :   static void *operator new (size_t);
     282                 :             : 
     283                 :             :   /* Return memory to slp_tree_pool.  */
     284                 :             :   static void operator delete (void *, size_t);
     285                 :             : 
     286                 :             :   /* Linked list of nodes to release when we free the slp_tree_pool.  */
     287                 :             :   slp_tree next_node;
     288                 :             :   slp_tree prev_node;
     289                 :             : };
     290                 :             : 
     291                 :             : /* The enum describes the type of operations that an SLP instance
     292                 :             :    can perform. */
     293                 :             : 
     294                 :             : enum slp_instance_kind {
     295                 :             :     slp_inst_kind_store,
     296                 :             :     slp_inst_kind_reduc_group,
     297                 :             :     slp_inst_kind_reduc_chain,
     298                 :             :     slp_inst_kind_bb_reduc,
     299                 :             :     slp_inst_kind_ctor,
     300                 :             :     slp_inst_kind_gcond
     301                 :             : };
     302                 :             : 
     303                 :             : /* SLP instance is a sequence of stmts in a loop that can be packed into
     304                 :             :    SIMD stmts.  */
     305                 :             : typedef class _slp_instance {
     306                 :             : public:
     307                 :             :   /* The root of SLP tree.  */
     308                 :             :   slp_tree root;
     309                 :             : 
     310                 :             :   /* For vector constructors, the constructor stmt that the SLP tree is built
     311                 :             :      from, NULL otherwise.  */
     312                 :             :   vec<stmt_vec_info> root_stmts;
     313                 :             : 
     314                 :             :   /* For slp_inst_kind_bb_reduc the defs that were not vectorized, NULL
     315                 :             :      otherwise.  */
     316                 :             :   vec<tree> remain_defs;
     317                 :             : 
     318                 :             :   /* The group of nodes that contain loads of this SLP instance.  */
     319                 :             :   vec<slp_tree> loads;
     320                 :             : 
     321                 :             :   /* The SLP node containing the reduction PHIs.  */
     322                 :             :   slp_tree reduc_phis;
     323                 :             : 
     324                 :             :   /* Vector cost of this entry to the SLP graph.  */
     325                 :             :   stmt_vector_for_cost cost_vec;
     326                 :             : 
     327                 :             :   /* If this instance is the main entry of a subgraph the set of
     328                 :             :      entries into the same subgraph, including itself.  */
     329                 :             :   vec<_slp_instance *> subgraph_entries;
     330                 :             : 
     331                 :             :   /* The type of operation the SLP instance is performing.  */
     332                 :             :   slp_instance_kind kind;
     333                 :             : 
     334                 :             :   dump_user_location_t location () const;
     335                 :             : } *slp_instance;
     336                 :             : 
     337                 :             : 
     338                 :             : /* Access Functions.  */
     339                 :             : #define SLP_INSTANCE_TREE(S)                     (S)->root
     340                 :             : #define SLP_INSTANCE_LOADS(S)                    (S)->loads
     341                 :             : #define SLP_INSTANCE_ROOT_STMTS(S)               (S)->root_stmts
     342                 :             : #define SLP_INSTANCE_REMAIN_DEFS(S)              (S)->remain_defs
     343                 :             : #define SLP_INSTANCE_KIND(S)                     (S)->kind
     344                 :             : 
     345                 :             : #define SLP_TREE_CHILDREN(S)                     (S)->children
     346                 :             : #define SLP_TREE_SCALAR_STMTS(S)                 (S)->stmts
     347                 :             : #define SLP_TREE_SCALAR_OPS(S)                   (S)->ops
     348                 :             : #define SLP_TREE_REF_COUNT(S)                    (S)->refcnt
     349                 :             : #define SLP_TREE_VEC_DEFS(S)                     (S)->vec_defs
     350                 :             : #define SLP_TREE_NUMBER_OF_VEC_STMTS(S)          (S)->vec_stmts_size
     351                 :             : #define SLP_TREE_LOAD_PERMUTATION(S)             (S)->load_permutation
     352                 :             : #define SLP_TREE_LANE_PERMUTATION(S)             (S)->lane_permutation
     353                 :             : #define SLP_TREE_SIMD_CLONE_INFO(S)              (S)->simd_clone_info
     354                 :             : #define SLP_TREE_DEF_TYPE(S)                     (S)->def_type
     355                 :             : #define SLP_TREE_VECTYPE(S)                      (S)->vectype
     356                 :             : #define SLP_TREE_REPRESENTATIVE(S)               (S)->representative
     357                 :             : #define SLP_TREE_LANES(S)                        (S)->lanes
     358                 :             : #define SLP_TREE_CODE(S)                         (S)->code
     359                 :             : #define SLP_TREE_MEMORY_ACCESS_TYPE(S)           (S)->memory_access_type
     360                 :             : 
     361                 :             : enum vect_partial_vector_style {
     362                 :             :     vect_partial_vectors_none,
     363                 :             :     vect_partial_vectors_while_ult,
     364                 :             :     vect_partial_vectors_avx512,
     365                 :             :     vect_partial_vectors_len
     366                 :             : };
     367                 :             : 
     368                 :             : /* Key for map that records association between
     369                 :             :    scalar conditions and corresponding loop mask, and
     370                 :             :    is populated by vect_record_loop_mask.  */
     371                 :             : 
     372                 :             : struct scalar_cond_masked_key
     373                 :             : {
     374                 :       46792 :   scalar_cond_masked_key (tree t, unsigned ncopies_)
     375                 :       46792 :     : ncopies (ncopies_)
     376                 :             :   {
     377                 :       46792 :     get_cond_ops_from_tree (t);
     378                 :             :   }
     379                 :             : 
     380                 :             :   void get_cond_ops_from_tree (tree);
     381                 :             : 
     382                 :             :   unsigned ncopies;
     383                 :             :   bool inverted_p;
     384                 :             :   tree_code code;
     385                 :             :   tree op0;
     386                 :             :   tree op1;
     387                 :             : };
     388                 :             : 
     389                 :             : template<>
     390                 :             : struct default_hash_traits<scalar_cond_masked_key>
     391                 :             : {
     392                 :             :   typedef scalar_cond_masked_key compare_type;
     393                 :             :   typedef scalar_cond_masked_key value_type;
     394                 :             : 
     395                 :             :   static inline hashval_t
     396                 :       54335 :   hash (value_type v)
     397                 :             :   {
     398                 :       54335 :     inchash::hash h;
     399                 :       54335 :     h.add_int (v.code);
     400                 :       54335 :     inchash::add_expr (v.op0, h, 0);
     401                 :       54335 :     inchash::add_expr (v.op1, h, 0);
     402                 :       54335 :     h.add_int (v.ncopies);
     403                 :       54335 :     h.add_flag (v.inverted_p);
     404                 :       54335 :     return h.end ();
     405                 :             :   }
     406                 :             : 
     407                 :             :   static inline bool
     408                 :        8431 :   equal (value_type existing, value_type candidate)
     409                 :             :   {
     410                 :        8431 :     return (existing.ncopies == candidate.ncopies
     411                 :        8427 :             && existing.code == candidate.code
     412                 :        4913 :             && existing.inverted_p == candidate.inverted_p
     413                 :        3459 :             && operand_equal_p (existing.op0, candidate.op0, 0)
     414                 :       10394 :             && operand_equal_p (existing.op1, candidate.op1, 0));
     415                 :             :   }
     416                 :             : 
     417                 :             :   static const bool empty_zero_p = true;
     418                 :             : 
     419                 :             :   static inline void
     420                 :           0 :   mark_empty (value_type &v)
     421                 :             :   {
     422                 :           0 :     v.ncopies = 0;
     423                 :           0 :     v.inverted_p = false;
     424                 :             :   }
     425                 :             : 
     426                 :             :   static inline bool
     427                 :     6309443 :   is_empty (value_type v)
     428                 :             :   {
     429                 :     6262667 :     return v.ncopies == 0;
     430                 :             :   }
     431                 :             : 
     432                 :             :   static inline void mark_deleted (value_type &) {}
     433                 :             : 
     434                 :             :   static inline bool is_deleted (const value_type &)
     435                 :             :   {
     436                 :             :     return false;
     437                 :             :   }
     438                 :             : 
     439                 :       40214 :   static inline void remove (value_type &) {}
     440                 :             : };
     441                 :             : 
     442                 :             : typedef hash_set<scalar_cond_masked_key> scalar_cond_masked_set_type;
     443                 :             : 
     444                 :             : /* Key and map that records association between vector conditions and
     445                 :             :    corresponding loop mask, and is populated by prepare_vec_mask.  */
     446                 :             : 
     447                 :             : typedef pair_hash<tree_operand_hash, tree_operand_hash> tree_cond_mask_hash;
     448                 :             : typedef hash_set<tree_cond_mask_hash> vec_cond_masked_set_type;
     449                 :             : 
     450                 :             : /* Describes two objects whose addresses must be unequal for the vectorized
     451                 :             :    loop to be valid.  */
     452                 :             : typedef std::pair<tree, tree> vec_object_pair;
     453                 :             : 
     454                 :             : /* Records that vectorization is only possible if abs (EXPR) >= MIN_VALUE.
     455                 :             :    UNSIGNED_P is true if we can assume that abs (EXPR) == EXPR.  */
     456                 :             : class vec_lower_bound {
     457                 :             : public:
     458                 :             :   vec_lower_bound () {}  /* Does not explicitly initialize any member.  */
     459                 :        1375 :   vec_lower_bound (tree e, bool u, poly_uint64 m)
     460                 :        1375 :     : expr (e), unsigned_p (u), min_value (m) {}
     461                 :             : 
     462                 :             :   tree expr;  /* EXPR in the description above.  */
     463                 :             :   bool unsigned_p;  /* UNSIGNED_P in the description above.  */
     464                 :             :   poly_uint64 min_value;  /* MIN_VALUE in the description above.  */
     465                 :             : };
     466                 :             : 
     467                 :             : /* Vectorizer state shared between different analyses like vector sizes
     468                 :             :    of the same CFG region.  */
     469                 :             : class vec_info_shared {
     470                 :             : public:
     471                 :             :   vec_info_shared();
     472                 :             :   ~vec_info_shared();
     473                 :             : 
     474                 :             :   void save_datarefs();
     475                 :             :   void check_datarefs();
     476                 :             : 
     477                 :             :   /* All data references.  Freed by free_data_refs, so not an auto_vec.  */
     478                 :             :   vec<data_reference_p> datarefs;
     479                 :             :   vec<data_reference> datarefs_copy;  /* NOTE(review): presumably the snapshot used by save_datarefs/check_datarefs -- confirm.  */
     480                 :             : 
     481                 :             :   /* The loop nest in which the data dependences are computed.  */
     482                 :             :   auto_vec<loop_p> loop_nest;
     483                 :             : 
     484                 :             :   /* All data dependences.  Freed by free_dependence_relations, so not
     485                 :             :      an auto_vec.  */
     486                 :             :   vec<ddr_p> ddrs;
     487                 :             : };
     488                 :             : 
     489                 :             : /* Vectorizer state common between loop and basic-block vectorization.  */
     490                 :             : class vec_info {
     491                 :             : public:
     492                 :             :   typedef hash_set<int_hash<machine_mode, E_VOIDmode, E_BLKmode> > mode_set;
     493                 :             :   enum vec_kind { bb, loop };  /* Tag tested by the is_a_helper specializations.  */
     494                 :             : 
     495                 :             :   vec_info (vec_kind, vec_info_shared *);
     496                 :             :   ~vec_info ();
     497                 :             : 
     498                 :             :   stmt_vec_info add_stmt (gimple *);
     499                 :             :   stmt_vec_info add_pattern_stmt (gimple *, stmt_vec_info);
     500                 :             :   stmt_vec_info resync_stmt_addr (gimple *);
     501                 :             :   stmt_vec_info lookup_stmt (gimple *);
     502                 :             :   stmt_vec_info lookup_def (tree);
     503                 :             :   stmt_vec_info lookup_single_use (tree);
     504                 :             :   class dr_vec_info *lookup_dr (data_reference *);
     505                 :             :   void move_dr (stmt_vec_info, stmt_vec_info);
     506                 :             :   void remove_stmt (stmt_vec_info);
     507                 :             :   void replace_stmt (gimple_stmt_iterator *, stmt_vec_info, gimple *);
     508                 :             :   void insert_on_entry (stmt_vec_info, gimple *);
     509                 :             :   void insert_seq_on_entry (stmt_vec_info, gimple_seq);
     510                 :             : 
     511                 :             :   /* The type of vectorization.  */
     512                 :             :   vec_kind kind;
     513                 :             : 
     514                 :             :   /* Shared vectorizer state.  */
     515                 :             :   vec_info_shared *shared;
     516                 :             : 
     517                 :             :   /* The mapping of GIMPLE UID to stmt_vec_info.  */
     518                 :             :   vec<stmt_vec_info> stmt_vec_infos;
     519                 :             :   /* Whether the above mapping is complete.  */
     520                 :             :   bool stmt_vec_info_ro;
     521                 :             : 
     522                 :             :   /* Whether we've done a transform for which we think it is OK not to
     523                 :             :      update virtual SSA form.  */
     524                 :             :   bool any_known_not_updated_vssa;
     525                 :             : 
     526                 :             :   /* The SLP graph.  */
     527                 :             :   auto_vec<slp_instance> slp_instances;
     528                 :             : 
     529                 :             :   /* Maps base addresses to an innermost_loop_behavior that gives the maximum
     530                 :             :      known alignment for that base.  */
     531                 :             :   vec_base_alignments base_alignments;
     532                 :             : 
     533                 :             :   /* All interleaving chains of stores, represented by the first
     534                 :             :      stmt in the chain.  */
     535                 :             :   auto_vec<stmt_vec_info> grouped_stores;
     536                 :             : 
     537                 :             :   /* The set of vector modes used in the vectorized region.  */
     538                 :             :   mode_set used_vector_modes;
     539                 :             : 
     540                 :             :   /* The argument we should pass to related_vector_mode when looking up
     541                 :             :      the vector mode for a scalar mode, or VOIDmode if we haven't yet
     542                 :             :      made any decisions about which vector modes to use.  */
     543                 :             :   machine_mode vector_mode;
     544                 :             : 
     545                 :             :   /* The basic blocks in the vectorization region.  For _loop_vec_info,
     546                 :             :      the memory is internally managed, while for _bb_vec_info, it points
     547                 :             :      to element space of an external auto_vec<>.  This inconsistency is
     548                 :             :      not a good class design pattern.  TODO: improve it with a unified
     549                 :             :      auto_vec<> whose lifetime is confined to vec_info object.  */
     550                 :             :   basic_block *bbs;
     551                 :             : 
     552                 :             :   /* The count of the basic blocks in the vectorization region.  */
     553                 :             :   unsigned int nbbs;
     554                 :             : 
     555                 :             :   /* Used to keep a sequence of def stmts of a pattern stmt that are loop
     556                 :             :     invariant, if they exist.
     557                 :             :     The sequence is emitted in the loop preheader should the loop be vectorized
     558                 :             :     and is reset when undoing patterns.  */
     559                 :             :   gimple_seq inv_pattern_def_seq;
     560                 :             : 
     561                 :             : private:
     562                 :             :   stmt_vec_info new_stmt_vec_info (gimple *stmt);
     563                 :             :   void set_vinfo_for_stmt (gimple *, stmt_vec_info, bool = true);
     564                 :             :   void free_stmt_vec_infos ();
     565                 :             :   void free_stmt_vec_info (stmt_vec_info);
     566                 :             : };
     567                 :             : 
     568                 :             : class _loop_vec_info;
     569                 :             : class _bb_vec_info;
     570                 :             : 
     571                 :             : template<>
     572                 :             : template<>
     573                 :             : inline bool
     574                 :   331735291 : is_a_helper <_loop_vec_info *>::test (vec_info *i)
     575                 :             : {
     576                 :   331139389 :   return i->kind == vec_info::loop;  /* Decided purely by the kind tag.  */
     577                 :             : }
     578                 :             : 
     579                 :             : template<>
     580                 :             : template<>
     581                 :             : inline bool
     582                 :    53725711 : is_a_helper <_bb_vec_info *>::test (vec_info *i)
     583                 :             : {
     584                 :    53725711 :   return i->kind == vec_info::bb;  /* Decided purely by the kind tag.  */
     585                 :             : }
     586                 :             : 
     587                 :             : /* In general, we can divide the vector statements in a vectorized loop
     588                 :             :    into related groups ("rgroups") and say that for each rgroup there is
     589                 :             :    some nS such that the rgroup operates on nS values from one scalar
     590                 :             :    iteration followed by nS values from the next.  That is, if VF is the
     591                 :             :    vectorization factor of the loop, the rgroup operates on a sequence:
     592                 :             : 
     593                 :             :      (1,1) (1,2) ... (1,nS) (2,1) ... (2,nS) ... (VF,1) ... (VF,nS)
     594                 :             : 
     595                 :             :    where (i,j) represents a scalar value with index j in a scalar
     596                 :             :    iteration with index i.
     597                 :             : 
     598                 :             :    [ We use the term "rgroup" to emphasise that this grouping isn't
     599                 :             :      necessarily the same as the grouping of statements used elsewhere.
     600                 :             :      For example, if we implement a group of scalar loads using gather
     601                 :             :      loads, we'll use a separate gather load for each scalar load, and
     602                 :             :      thus each gather load will belong to its own rgroup. ]
     603                 :             : 
     604                 :             :    In general this sequence will occupy nV vectors concatenated
     605                 :             :    together.  If these vectors have nL lanes each, the total number
     606                 :             :    of scalar values N is given by:
     607                 :             : 
     608                 :             :        N = nS * VF = nV * nL
     609                 :             : 
     610                 :             :    None of nS, VF, nV and nL are required to be a power of 2.  nS and nV
     611                 :             :    are compile-time constants but VF and nL can be variable (if the target
     612                 :             :    supports variable-length vectors).
     613                 :             : 
     614                 :             :    In classical vectorization, each iteration of the vector loop would
     615                 :             :    handle exactly VF iterations of the original scalar loop.  However,
     616                 :             :    in vector loops that are able to operate on partial vectors, a
     617                 :             :    particular iteration of the vector loop might handle fewer than VF
     618                 :             :    iterations of the scalar loop.  The vector lanes that correspond to
     619                 :             :    iterations of the scalar loop are said to be "active" and the other
     620                 :             :    lanes are said to be "inactive".
     621                 :             : 
     622                 :             :    In such vector loops, many rgroups need to be controlled to ensure
     623                 :             :    that they have no effect for the inactive lanes.  Conceptually, each
     624                 :             :    such rgroup needs a sequence of booleans in the same order as above,
     625                 :             :    but with each (i,j) replaced by a boolean that indicates whether
     626                 :             :    iteration i is active.  This sequence occupies nV vector controls
     627                 :             :    that again have nL lanes each.  Thus the control sequence as a whole
     628                 :             :    consists of VF independent booleans that are each repeated nS times.
     629                 :             : 
     630                 :             :    Take the mask-based approach as an example of partially-populated vectors.
     631                 :             :    We make the simplifying assumption that if a sequence of nV masks is
     632                 :             :    suitable for one (nS,nL) pair, we can reuse it for (nS/2,nL/2) by
     633                 :             :    VIEW_CONVERTing it.  This holds for all current targets that support
     634                 :             :    fully-masked loops.  For example, suppose the scalar loop is:
     635                 :             : 
     636                 :             :      float *f;
     637                 :             :      double *d;
     638                 :             :      for (int i = 0; i < n; ++i)
     639                 :             :        {
     640                 :             :          f[i * 2 + 0] += 1.0f;
     641                 :             :          f[i * 2 + 1] += 2.0f;
     642                 :             :          d[i] += 3.0;
     643                 :             :        }
     644                 :             : 
     645                 :             :    and suppose that vectors have 256 bits.  The vectorized f accesses
     646                 :             :    will belong to one rgroup and the vectorized d access to another:
     647                 :             : 
     648                 :             :      f rgroup: nS = 2, nV = 1, nL = 8
     649                 :             :      d rgroup: nS = 1, nV = 1, nL = 4
     650                 :             :                VF = 4
     651                 :             : 
     652                 :             :      [ In this simple example the rgroups do correspond to the normal
     653                 :             :        SLP grouping scheme. ]
     654                 :             : 
     655                 :             :    If only the first three lanes are active, the masks we need are:
     656                 :             : 
     657                 :             :      f rgroup: 1 1 | 1 1 | 1 1 | 0 0
     658                 :             :      d rgroup:  1  |  1  |  1  |  0
     659                 :             : 
     660                 :             :    Here we can use a mask calculated for f's rgroup for d's, but not
     661                 :             :    vice versa.
     662                 :             : 
     663                 :             :    Thus for each value of nV, it is enough to provide nV masks, with the
     664                 :             :    mask being calculated based on the highest nL (or, equivalently, based
     665                 :             :    on the highest nS) required by any rgroup with that nV.  We therefore
     666                 :             :    represent the entire collection of masks as a two-level table, with the
     667                 :             :    first level being indexed by nV - 1 (since nV == 0 doesn't exist) and
     668                 :             :    the second being indexed by the mask index 0 <= i < nV.  */
     669                 :             : 
     670                 :             : /* The controls (like masks or lengths) needed by rgroups with nV vectors,
     671                 :             :    according to the description above.  */
     672                 :             : struct rgroup_controls {
     673                 :             :   /* The largest nS for all rgroups that use these controls.
     674                 :             :      For vect_partial_vectors_avx512 this is the constant nscalars_per_iter
     675                 :             :      for all members of the group.  */
     676                 :             :   unsigned int max_nscalars_per_iter;
     677                 :             : 
     678                 :             :   /* For the largest nS recorded above, the loop controls divide each scalar
     679                 :             :      into FACTOR equal-sized pieces.  This is useful if we need to split
     680                 :             :      element-based accesses into byte-based accesses.
     681                 :             :      For vect_partial_vectors_avx512 this records nV instead.  */
     682                 :             :   unsigned int factor;
     683                 :             : 
     684                 :             :   /* This is a vector type with MAX_NSCALARS_PER_ITER * VF / nV elements.
     685                 :             :      For mask-based controls, it is the type of the masks in CONTROLS.
     686                 :             :      For length-based controls, it can be any vector type that has the
     687                 :             :      specified number of elements; the type of the elements doesn't matter.  */
     688                 :             :   tree type;
     689                 :             : 
     690                 :             :   /* When there is no uniformly used LOOP_VINFO_RGROUP_COMPARE_TYPE this
     691                 :             :      is the rgroup specific type used.  */
     692                 :             :   tree compare_type;
     693                 :             : 
     694                 :             :   /* A vector of nV controls, in iteration order.  */
     695                 :             :   vec<tree> controls;
     696                 :             : 
     697                 :             :   /* In case of len_load and len_store with a bias there is only one
     698                 :             :      rgroup.  This holds the adjusted loop length for this rgroup.  */
     699                 :             :   tree bias_adjusted_ctrl;
     700                 :             : };
     701                 :             : 
     702                 :      387725 : struct vec_loop_masks
     703                 :             : {
     704                 :      315281 :   bool is_empty () const { return mask_set.is_empty (); }  /* True if mask_set holds no entries.  */
     705                 :             : 
     706                 :             :   /* Set to record vectype, nvector pairs.  */
     707                 :             :   hash_set<pair_hash <nofree_ptr_hash <tree_node>,
     708                 :             :                       int_hash<unsigned, 0>>> mask_set;
     709                 :             : 
     710                 :             :   /* rgroup_controls used for the partial vector scheme.  */
     711                 :             :   auto_vec<rgroup_controls> rgc_vec;
     712                 :             : };
     713                 :             : 
     714                 :             : typedef auto_vec<rgroup_controls> vec_loop_lens;
     715                 :             : 
     716                 :             : typedef auto_vec<std::pair<data_reference*, tree> > drs_init_vec;
     717                 :             : 
     718                 :             : /* Information about a reduction accumulator from the main loop that could
     719                 :             :    conceivably be reused as the input to a reduction in an epilogue loop.  */
     720                 :             : struct vect_reusable_accumulator {  /* Value type of _loop_vec_info::reusable_accumulators.  */
     721                 :             :   /* The final value of the accumulator, which forms the input to the
     722                 :             :      reduction operation.  */
     723                 :             :   tree reduc_input;
     724                 :             : 
     725                 :             :   /* The stmt_vec_info that describes the reduction (i.e. the one for
     726                 :             :      which is_reduc_info is true).  */
     727                 :             :   stmt_vec_info reduc_info;
     728                 :             : };
     729                 :             : 
     730                 :             : /*-----------------------------------------------------------------*/
     731                 :             : /* Info on vectorized loops.                                       */
     732                 :             : /*-----------------------------------------------------------------*/
     733                 :             : typedef class _loop_vec_info : public vec_info {
     734                 :             : public:
     735                 :             :   _loop_vec_info (class loop *, vec_info_shared *);
     736                 :             :   ~_loop_vec_info ();
     737                 :             : 
     738                 :             :   /* The loop to which this info struct refers.  */
     739                 :             :   class loop *loop;
     740                 :             : 
     741                 :             :   /* Number of latch executions.  */
     742                 :             :   tree num_itersm1;
     743                 :             :   /* Number of iterations.  */
     744                 :             :   tree num_iters;
     745                 :             :   /* Number of iterations of the original loop.  */
     746                 :             :   tree num_iters_unchanged;
     747                 :             :   /* Condition under which this loop is analyzed and versioned.  */
     748                 :             :   tree num_iters_assumptions;
     749                 :             : 
     750                 :             :   /* The cost of the vector code.  */
     751                 :             :   class vector_costs *vector_costs;
     752                 :             : 
     753                 :             :   /* The cost of the scalar code.  */
     754                 :             :   class vector_costs *scalar_costs;
     755                 :             : 
     756                 :             :   /* Threshold of number of iterations below which vectorization will not be
     757                 :             :      performed. It is calculated from MIN_PROFITABLE_ITERS and
     758                 :             :      param_min_vect_loop_bound.  */
     759                 :             :   unsigned int th;
     760                 :             : 
     761                 :             :   /* When applying loop versioning, the vector form should only be used
     762                 :             :      if the number of scalar iterations is >= this value, on top of all
     763                 :             :      the other requirements.  Ignored when loop versioning is not being
     764                 :             :      used.  */
     765                 :             :   poly_uint64 versioning_threshold;
     766                 :             : 
     767                 :             :   /* Unrolling factor  */
     768                 :             :   poly_uint64 vectorization_factor;
     769                 :             : 
     770                 :             :   /* If this loop is an epilogue loop whose main loop can be skipped,
     771                 :             :      MAIN_LOOP_EDGE is the edge from the main loop to this loop's
     772                 :             :      preheader.  SKIP_MAIN_LOOP_EDGE is then the edge that skips the
     773                 :             :      main loop and goes straight to this loop's preheader.
     774                 :             : 
     775                 :             :      Both fields are null otherwise.  */
     776                 :             :   edge main_loop_edge;
     777                 :             :   edge skip_main_loop_edge;
     778                 :             : 
     779                 :             :   /* If this loop is an epilogue loop that might be skipped after executing
     780                 :             :      the main loop, this edge is the one that skips the epilogue.  */
     781                 :             :   edge skip_this_loop_edge;
     782                 :             : 
     783                 :             :   /* The vectorized form of a standard reduction replaces the original
     784                 :             :      scalar code's final result (a loop-closed SSA PHI) with the result
     785                 :             :      of a vector-to-scalar reduction operation.  After vectorization,
     786                 :             :      this variable maps these vector-to-scalar results to information
     787                 :             :      about the reductions that generated them.  */
     788                 :             :   hash_map<tree, vect_reusable_accumulator> reusable_accumulators;
     789                 :             : 
     790                 :             :   /* The number of times that the target suggested we unroll the vector loop
     791                 :             :      in order to promote more ILP.  This value will be used to re-analyze the
     792                 :             :      loop for vectorization and if successful the value will be folded into
     793                 :             :      vectorization_factor (and therefore exactly divides
     794                 :             :      vectorization_factor).  */
     795                 :             :   unsigned int suggested_unroll_factor;
     796                 :             : 
     797                 :             :   /* Maximum runtime vectorization factor, or MAX_VECTORIZATION_FACTOR
     798                 :             :      if there is no particular limit.  */
     799                 :             :   unsigned HOST_WIDE_INT max_vectorization_factor;
     800                 :             : 
     801                 :             :   /* The masks that a fully-masked loop should use to avoid operating
     802                 :             :      on inactive scalars.  */
     803                 :             :   vec_loop_masks masks;
     804                 :             : 
     805                 :             :   /* The lengths that a loop with length should use to avoid operating
     806                 :             :      on inactive scalars.  */
     807                 :             :   vec_loop_lens lens;
     808                 :             : 
     809                 :             :   /* Set of scalar conditions that have loop mask applied.  */
     810                 :             :   scalar_cond_masked_set_type scalar_cond_masked_set;
     811                 :             : 
     812                 :             :   /* Set of vector conditions that have loop mask applied.  */
     813                 :             :   vec_cond_masked_set_type vec_cond_masked_set;
     814                 :             : 
     815                 :             :   /* If we are using a loop mask to align memory addresses, this variable
     816                 :             :      contains the number of vector elements that we should skip in the
     817                 :             :      first iteration of the vector loop (i.e. the number of leading
     818                 :             :      elements that should be false in the first mask).  */
     819                 :             :   tree mask_skip_niters;
     820                 :             : 
     821                 :             :   /* The type that the loop control IV should be converted to before
     822                 :             :      testing which of the VF scalars are active and inactive.
     823                 :             :      Only meaningful if LOOP_VINFO_USING_PARTIAL_VECTORS_P.  */
     824                 :             :   tree rgroup_compare_type;
     825                 :             : 
     826                 :             :   /* For #pragma omp simd if (x) loops the x expression.  If constant 0,
     827                 :             :      the loop should not be vectorized, if constant non-zero, simd_if_cond
     828                 :             :      shouldn't be set and loop vectorized normally, if SSA_NAME, the loop
     829                 :             :      should be versioned on that condition, using scalar loop if the condition
     830                 :             :      is false and vectorized loop otherwise.  */
     831                 :             :   tree simd_if_cond;
     832                 :             : 
     833                 :             :   /* The type that the vector loop control IV should have when
     834                 :             :      LOOP_VINFO_USING_PARTIAL_VECTORS_P is true.  */
     835                 :             :   tree rgroup_iv_type;
     836                 :             : 
     837                 :             :   /* The style used for implementing partial vectors when
     838                 :             :      LOOP_VINFO_USING_PARTIAL_VECTORS_P is true.  */
     839                 :             :   vect_partial_vector_style partial_vector_style;
     840                 :             : 
     841                 :             :   /* Unknown DRs according to which loop was peeled.  */
     842                 :             :   class dr_vec_info *unaligned_dr;
     843                 :             : 
     844                 :             :   /* peeling_for_alignment indicates whether peeling for alignment will take
     845                 :             :      place, and what the peeling factor should be:
     846                 :             :      peeling_for_alignment = X means:
     847                 :             :         If X=0: Peeling for alignment will not be applied.
     848                 :             :         If X>0: Peel first X iterations.
     849                 :             :         If X=-1: Generate a runtime test to calculate the number of iterations
     850                 :             :                  to be peeled, using the dataref recorded in the field
     851                 :             :                  unaligned_dr.  */
     852                 :             :   int peeling_for_alignment;
     853                 :             : 
     854                 :             :   /* The mask used to check the alignment of pointers or arrays.  */
     855                 :             :   int ptr_mask;
     856                 :             : 
     857                 :             :   /* Data Dependence Relations defining address ranges that are candidates
     858                 :             :      for a run-time aliasing check.  */
     859                 :             :   auto_vec<ddr_p> may_alias_ddrs;
     860                 :             : 
     861                 :             :   /* Data Dependence Relations defining address ranges together with segment
     862                 :             :      lengths from which the run-time aliasing check is built.  */
     863                 :             :   auto_vec<dr_with_seg_len_pair_t> comp_alias_ddrs;
     864                 :             : 
     865                 :             :   /* Check that the addresses of each pair of objects is unequal.  */
     866                 :             :   auto_vec<vec_object_pair> check_unequal_addrs;
     867                 :             : 
     868                 :             :   /* List of values that are required to be nonzero.  This is used to check
     869                 :             :      whether things like "x[i * n] += 1;" are safe and eventually gets added
     870                 :             :      to the checks for lower bounds below.  */
     871                 :             :   auto_vec<tree> check_nonzero;
     872                 :             : 
     873                 :             :   /* List of values that need to be checked for a minimum value.  */
     874                 :             :   auto_vec<vec_lower_bound> lower_bounds;
     875                 :             : 
     876                 :             :   /* Statements in the loop that have data references that are candidates for a
     877                 :             :      runtime (loop versioning) misalignment check.  */
     878                 :             :   auto_vec<stmt_vec_info> may_misalign_stmts;
     879                 :             : 
     880                 :             :   /* Reduction cycles detected in the loop. Used in loop-aware SLP.  */
     881                 :             :   auto_vec<stmt_vec_info> reductions;
     882                 :             : 
     883                 :             :   /* All reduction chains in the loop, represented by the first
     884                 :             :      stmt in the chain.  */
     885                 :             :   auto_vec<stmt_vec_info> reduction_chains;
     886                 :             : 
     887                 :             :   /* Cost vector for a single scalar iteration.  */
     888                 :             :   auto_vec<stmt_info_for_cost> scalar_cost_vec;
     889                 :             : 
     890                 :             :   /* Map of IV base/step expressions to inserted name in the preheader.  */
     891                 :             :   hash_map<tree_operand_hash, tree> *ivexpr_map;
     892                 :             : 
     893                 :             :   /* Map of OpenMP "omp simd array" scan variables to corresponding
     894                 :             :      rhs of the store of the initializer.  */
     895                 :             :   hash_map<tree, tree> *scan_map;
     896                 :             : 
     897                 :             :   /* The unrolling factor needed to SLP the loop.  If pure SLP is
     898                 :             :      applied to the loop, i.e., no unrolling is needed, this is 1.  */
     899                 :             :   poly_uint64 slp_unrolling_factor;
     900                 :             : 
     901                 :             :   /* The factor used to over weight those statements in an inner loop
     902                 :             :      relative to the loop being vectorized.  */
     903                 :             :   unsigned int inner_loop_cost_factor;
     904                 :             : 
     905                 :             :   /* Is the loop vectorizable? */
     906                 :             :   bool vectorizable;
     907                 :             : 
     908                 :             :   /* Records whether we still have the option of vectorizing this loop
     909                 :             :      using partially-populated vectors; in other words, whether it is
     910                 :             :      still possible for one iteration of the vector loop to handle
     911                 :             :      fewer than VF scalars.  */
     912                 :             :   bool can_use_partial_vectors_p;
     913                 :             : 
     914                 :             :   /* Records whether we must use niter masking for correctness reasons.  */
     915                 :             :   bool must_use_partial_vectors_p;
     916                 :             : 
     917                 :             :   /* True if we've decided to use partially-populated vectors, so that
     918                 :             :      the vector loop can handle fewer than VF scalars.  */
     919                 :             :   bool using_partial_vectors_p;
     920                 :             : 
     921                 :             :   /* True if we've decided to use a decrementing loop control IV that counts
     922                 :             :      scalars. This can be done for any loop that:
     923                 :             : 
     924                 :             :         (a) uses length "controls"; and
     925                 :             :         (b) can iterate more than once.  */
     926                 :             :   bool using_decrementing_iv_p;
     927                 :             : 
     928                 :             :   /* True if we've decided to use output of select_vl to adjust IV of
     929                 :             :      both loop control and data reference pointer. This is only true
     930                 :             :      for single-rgroup control.  */
     931                 :             :   bool using_select_vl_p;
     932                 :             : 
     933                 :             :   /* True if we've decided to use partially-populated vectors for the
     934                 :             :      epilogue of loop.  */
     935                 :             :   bool epil_using_partial_vectors_p;
     936                 :             : 
     937                 :             :   /* The bias for len_load and len_store.  For now, only 0 and -1 are
     938                 :             :      supported.  -1 must be used when a backend does not support
     939                 :             :      len_load/len_store with a length of zero.  */
     940                 :             :   signed char partial_load_store_bias;
     941                 :             : 
     942                 :             :   /* When we have grouped data accesses with gaps, we may introduce invalid
     943                 :             :      memory accesses.  We peel the last iteration of the loop to prevent
     944                 :             :      this.  */
     945                 :             :   bool peeling_for_gaps;
     946                 :             : 
     947                 :             :   /* When the number of iterations is not a multiple of the vector size
     948                 :             :      we need to peel off iterations at the end to form an epilogue loop.  */
     949                 :             :   bool peeling_for_niter;
     950                 :             : 
     951                 :             :   /* When the loop has early breaks that we can vectorize we need to peel
     952                 :             :      the loop for the break finding loop.  */
     953                 :             :   bool early_breaks;
     954                 :             : 
     955                 :             :   /* List of additional loop IV conditionals found in the loop.  */
     956                 :             :   auto_vec<gcond *> conds;
     957                 :             : 
     958                 :             :   /* Main loop IV cond.  */
     959                 :             :   gcond* loop_iv_cond;
     960                 :             : 
     961                 :             :   /* True if there are no loop carried data dependencies in the loop.
     962                 :             :      If loop->safelen <= 1, then this is always true, either the loop
     963                 :             :      didn't have any loop carried data dependencies, or the loop is being
     964                 :             :      vectorized guarded with some runtime alias checks, or couldn't
     965                 :             :      be vectorized at all, but then this field shouldn't be used.
     966                 :             :      For loop->safelen >= 2, the user has asserted that there are no
     967                 :             :      backward dependencies, but there still could be loop carried forward
     968                 :             :      dependencies in such loops.  This flag will be false if normal
     969                 :             :      vectorizer data dependency analysis would fail or require versioning
     970                 :             :      for alias, but because of loop->safelen >= 2 it has been vectorized
     971                 :             :      even without versioning for alias.  E.g. in:
     972                 :             :      #pragma omp simd
     973                 :             :      for (int i = 0; i < m; i++)
     974                 :             :        a[i] = a[i + k] * c;
     975                 :             :      (or #pragma simd or #pragma ivdep) we can vectorize this and it will
     976                 :             :      DTRT even for k > 0 && k < m, but without safelen we would not
     977                 :             :      vectorize this, so this field would be false.  */
     978                 :             :   bool no_data_dependencies;
     979                 :             : 
     980                 :             :   /* Mark loops having masked stores.  */
     981                 :             :   bool has_mask_store;
     982                 :             : 
     983                 :             :   /* Queued scaling factor for the scalar loop.  */
     984                 :             :   profile_probability scalar_loop_scaling;
     985                 :             : 
     986                 :             :   /* If if-conversion versioned this loop before conversion, this is the
     987                 :             :      loop version without if-conversion.  */
     988                 :             :   class loop *scalar_loop;
     989                 :             : 
     990                 :             :   /* For loops being epilogues of already vectorized loops
     991                 :             :      this points to the main vectorized loop.  Otherwise NULL.  */
     992                 :             :   _loop_vec_info *main_loop_info;
     993                 :             : 
     994                 :             :   /* For loops being epilogues of already vectorized loops
     995                 :             :      this points to the preceding vectorized (possibly epilogue) loop.
     996                 :             :      Otherwise NULL.  */
     997                 :             :   _loop_vec_info *orig_loop_info;
     998                 :             : 
     999                 :             :   /* Used to store loop_vec_infos of the epilogue of this loop during
    1000                 :             :      analysis.  */
    1001                 :             :   _loop_vec_info *epilogue_vinfo;
    1002                 :             : 
    1003                 :             :   /* If this is an epilogue loop the DR advancement applied.  */
    1004                 :             :   tree drs_advanced_by;
    1005                 :             : 
    1006                 :             :   /* The controlling loop IV for the current loop when vectorizing.  This IV
    1007                 :             :      controls the natural exits of the loop.  */
    1008                 :             :   edge vec_loop_iv_exit;
    1009                 :             : 
    1010                 :             :   /* The controlling loop IV for the epilogue loop when vectorizing.  This IV
    1011                 :             :      controls the natural exits of the loop.  */
    1012                 :             :   edge vec_epilogue_loop_iv_exit;
    1013                 :             : 
    1014                 :             :   /* The controlling loop IV for the scalar loop being vectorized.  This IV
    1015                 :             :      controls the natural exits of the loop.  */
    1016                 :             :   edge scalar_loop_iv_exit;
    1017                 :             : 
    1018                 :             :   /* Used to store the list of stores needing to be moved if doing early
    1019                 :             :      break vectorization as they would violate the scalar loop semantics if
    1020                 :             :      vectorized in their current location.  These are stored in order that they
    1021                 :             :      need to be moved.  */
    1022                 :             :   auto_vec<gimple *> early_break_stores;
    1023                 :             : 
    1024                 :             :   /* The final basic block where to move statements to.  In the case of
    1025                 :             :      multiple exits this could be pretty far away.  */
    1026                 :             :   basic_block early_break_dest_bb;
    1027                 :             : 
    1028                 :             :   /* Statements whose VUSES need updating if early break vectorization is to
    1029                 :             :      happen.  */
    1030                 :             :   auto_vec<gimple*> early_break_vuses;
    1031                 :             : 
    1032                 :             :   /* Record statements that are needed to be live for early break vectorization
    1033                 :             :      but may not have an LC PHI node materialized yet in the exits.  */
    1034                 :             :   auto_vec<stmt_vec_info> early_break_live_ivs;
    1035                 :             : } *loop_vec_info;
    1036                 :             : 
    1037                 :             : /* Access Functions.  Most of these expand to a plain member access on loop_vec_info L.  */
    1038                 :             : #define LOOP_VINFO_LOOP(L)                 (L)->loop
    1039                 :             : #define LOOP_VINFO_IV_EXIT(L)              (L)->vec_loop_iv_exit
    1040                 :             : #define LOOP_VINFO_EPILOGUE_IV_EXIT(L)     (L)->vec_epilogue_loop_iv_exit
    1041                 :             : #define LOOP_VINFO_SCALAR_IV_EXIT(L)       (L)->scalar_loop_iv_exit
    1042                 :             : #define LOOP_VINFO_BBS(L)                  (L)->bbs
    1043                 :             : #define LOOP_VINFO_NBBS(L)                 (L)->nbbs
    1044                 :             : #define LOOP_VINFO_NITERSM1(L)             (L)->num_itersm1
    1045                 :             : #define LOOP_VINFO_NITERS(L)               (L)->num_iters
    1046                 :             : /* Since LOOP_VINFO_NITERS and LOOP_VINFO_NITERSM1 can change after
    1047                 :             :    prologue peeling retain total unchanged scalar loop iterations for
    1048                 :             :    cost model.  */
    1049                 :             : #define LOOP_VINFO_NITERS_UNCHANGED(L)     (L)->num_iters_unchanged
    1050                 :             : #define LOOP_VINFO_NITERS_ASSUMPTIONS(L)   (L)->num_iters_assumptions
    1051                 :             : #define LOOP_VINFO_COST_MODEL_THRESHOLD(L) (L)->th
    1052                 :             : #define LOOP_VINFO_VERSIONING_THRESHOLD(L) (L)->versioning_threshold
    1053                 :             : #define LOOP_VINFO_VECTORIZABLE_P(L)       (L)->vectorizable
    1054                 :             : #define LOOP_VINFO_CAN_USE_PARTIAL_VECTORS_P(L) (L)->can_use_partial_vectors_p
    1055                 :             : #define LOOP_VINFO_MUST_USE_PARTIAL_VECTORS_P(L) (L)->must_use_partial_vectors_p
    1056                 :             : #define LOOP_VINFO_USING_PARTIAL_VECTORS_P(L) (L)->using_partial_vectors_p
    1057                 :             : #define LOOP_VINFO_USING_DECREMENTING_IV_P(L) (L)->using_decrementing_iv_p
    1058                 :             : #define LOOP_VINFO_USING_SELECT_VL_P(L) (L)->using_select_vl_p
    1059                 :             : #define LOOP_VINFO_EPIL_USING_PARTIAL_VECTORS_P(L)                             \
    1060                 :             :   (L)->epil_using_partial_vectors_p
    1061                 :             : #define LOOP_VINFO_PARTIAL_LOAD_STORE_BIAS(L) (L)->partial_load_store_bias
    1062                 :             : #define LOOP_VINFO_VECT_FACTOR(L)          (L)->vectorization_factor
    1063                 :             : #define LOOP_VINFO_MAX_VECT_FACTOR(L)      (L)->max_vectorization_factor
    1064                 :             : #define LOOP_VINFO_MASKS(L)                (L)->masks
    1065                 :             : #define LOOP_VINFO_LENS(L)                 (L)->lens
    1066                 :             : #define LOOP_VINFO_MASK_SKIP_NITERS(L)     (L)->mask_skip_niters
    1067                 :             : #define LOOP_VINFO_RGROUP_COMPARE_TYPE(L)  (L)->rgroup_compare_type
    1068                 :             : #define LOOP_VINFO_RGROUP_IV_TYPE(L)       (L)->rgroup_iv_type
    1069                 :             : #define LOOP_VINFO_PARTIAL_VECTORS_STYLE(L) (L)->partial_vector_style
    1070                 :             : #define LOOP_VINFO_PTR_MASK(L)             (L)->ptr_mask
    1071                 :             : #define LOOP_VINFO_LOOP_NEST(L)            (L)->shared->loop_nest
    1072                 :             : #define LOOP_VINFO_DATAREFS(L)             (L)->shared->datarefs
    1073                 :             : #define LOOP_VINFO_DDRS(L)                 (L)->shared->ddrs
    1074                 :             : #define LOOP_VINFO_INT_NITERS(L)           (TREE_INT_CST_LOW ((L)->num_iters))
    1075                 :             : #define LOOP_VINFO_PEELING_FOR_ALIGNMENT(L) (L)->peeling_for_alignment
    1076                 :             : #define LOOP_VINFO_UNALIGNED_DR(L)         (L)->unaligned_dr
    1077                 :             : #define LOOP_VINFO_MAY_MISALIGN_STMTS(L)   (L)->may_misalign_stmts
    1078                 :             : #define LOOP_VINFO_MAY_ALIAS_DDRS(L)       (L)->may_alias_ddrs
    1079                 :             : #define LOOP_VINFO_COMP_ALIAS_DDRS(L)      (L)->comp_alias_ddrs
    1080                 :             : #define LOOP_VINFO_CHECK_UNEQUAL_ADDRS(L)  (L)->check_unequal_addrs
    1081                 :             : #define LOOP_VINFO_CHECK_NONZERO(L)        (L)->check_nonzero
    1082                 :             : #define LOOP_VINFO_LOWER_BOUNDS(L)         (L)->lower_bounds
    1083                 :             : #define LOOP_VINFO_GROUPED_STORES(L)       (L)->grouped_stores
    1084                 :             : #define LOOP_VINFO_SLP_INSTANCES(L)        (L)->slp_instances
    1085                 :             : #define LOOP_VINFO_SLP_UNROLLING_FACTOR(L) (L)->slp_unrolling_factor
    1086                 :             : #define LOOP_VINFO_REDUCTIONS(L)           (L)->reductions
    1087                 :             : #define LOOP_VINFO_REDUCTION_CHAINS(L)     (L)->reduction_chains
    1088                 :             : #define LOOP_VINFO_PEELING_FOR_GAPS(L)     (L)->peeling_for_gaps
    1089                 :             : #define LOOP_VINFO_PEELING_FOR_NITER(L)    (L)->peeling_for_niter
    1090                 :             : #define LOOP_VINFO_EARLY_BREAKS(L)         (L)->early_breaks
    1091                 :             : #define LOOP_VINFO_EARLY_BRK_STORES(L)     (L)->early_break_stores
    1092                 :             : #define LOOP_VINFO_EARLY_BREAKS_VECT_PEELED(L)  \
    1093                 :             :   (single_pred ((L)->loop->latch) != (L)->vec_loop_iv_exit->src)
    1094                 :             : #define LOOP_VINFO_EARLY_BREAKS_LIVE_IVS(L)  \
    1095                 :             :   (L)->early_break_live_ivs
    1096                 :             : #define LOOP_VINFO_EARLY_BRK_DEST_BB(L)    (L)->early_break_dest_bb
    1097                 :             : #define LOOP_VINFO_EARLY_BRK_VUSES(L)      (L)->early_break_vuses
    1098                 :             : #define LOOP_VINFO_LOOP_CONDS(L)           (L)->conds
    1099                 :             : #define LOOP_VINFO_LOOP_IV_COND(L)         (L)->loop_iv_cond
    1100                 :             : #define LOOP_VINFO_NO_DATA_DEPENDENCIES(L) (L)->no_data_dependencies
    1101                 :             : #define LOOP_VINFO_SCALAR_LOOP(L)          (L)->scalar_loop
    1102                 :             : #define LOOP_VINFO_SCALAR_LOOP_SCALING(L)  (L)->scalar_loop_scaling
    1103                 :             : #define LOOP_VINFO_HAS_MASK_STORE(L)       (L)->has_mask_store
    1104                 :             : #define LOOP_VINFO_SCALAR_ITERATION_COST(L) (L)->scalar_cost_vec
    1105                 :             : #define LOOP_VINFO_MAIN_LOOP_INFO(L)       (L)->main_loop_info
    1106                 :             : #define LOOP_VINFO_ORIG_LOOP_INFO(L)       (L)->orig_loop_info
    1107                 :             : #define LOOP_VINFO_SIMD_IF_COND(L)         (L)->simd_if_cond
    1108                 :             : #define LOOP_VINFO_INNER_LOOP_COST_FACTOR(L) (L)->inner_loop_cost_factor
    1109                 :             : #define LOOP_VINFO_INV_PATTERN_DEF_SEQ(L)  (L)->inv_pattern_def_seq
    1110                 :             : #define LOOP_VINFO_DRS_ADVANCED_BY(L)      (L)->drs_advanced_by
    1111                 :             : /* True if L uses partial vectors and its set of masks is non-empty.  */
    1112                 :             : #define LOOP_VINFO_FULLY_MASKED_P(L)            \
    1113                 :             :   (LOOP_VINFO_USING_PARTIAL_VECTORS_P (L)       \
    1114                 :             :    && !LOOP_VINFO_MASKS (L).is_empty ())
    1115                 :             : /* True if L uses partial vectors and its set of lens is non-empty.  */
    1116                 :             : #define LOOP_VINFO_FULLY_WITH_LENGTH_P(L)       \
    1117                 :             :   (LOOP_VINFO_USING_PARTIAL_VECTORS_P (L)       \
    1118                 :             :    && !LOOP_VINFO_LENS (L).is_empty ())
    1119                 :             : /* Versioning predicates: each is true when L has recorded the corresponding item (misaligned stmts, alias/address/bound checks, niter assumptions, simd if condition).  */
    1120                 :             : #define LOOP_REQUIRES_VERSIONING_FOR_ALIGNMENT(L)       \
    1121                 :             :   ((L)->may_misalign_stmts.length () > 0)
    1122                 :             : #define LOOP_REQUIRES_VERSIONING_FOR_ALIAS(L)           \
    1123                 :             :   ((L)->comp_alias_ddrs.length () > 0 \
    1124                 :             :    || (L)->check_unequal_addrs.length () > 0 \
    1125                 :             :    || (L)->lower_bounds.length () > 0)
    1126                 :             : #define LOOP_REQUIRES_VERSIONING_FOR_NITERS(L)          \
    1127                 :             :   (LOOP_VINFO_NITERS_ASSUMPTIONS (L))
    1128                 :             : #define LOOP_REQUIRES_VERSIONING_FOR_SIMD_IF_COND(L)    \
    1129                 :             :   (LOOP_VINFO_SIMD_IF_COND (L))
    1130                 :             : #define LOOP_REQUIRES_VERSIONING(L)                     \
    1131                 :             :   (LOOP_REQUIRES_VERSIONING_FOR_ALIGNMENT (L)           \
    1132                 :             :    || LOOP_REQUIRES_VERSIONING_FOR_ALIAS (L)            \
    1133                 :             :    || LOOP_REQUIRES_VERSIONING_FOR_NITERS (L)           \
    1134                 :             :    || LOOP_REQUIRES_VERSIONING_FOR_SIMD_IF_COND (L))
    1135                 :             : /* True if num_iters of L passes tree_fits_shwi_p and its tree_to_shwi value is positive.  Evaluates L more than once.  */
    1136                 :             : #define LOOP_VINFO_NITERS_KNOWN_P(L)          \
    1137                 :             :   (tree_fits_shwi_p ((L)->num_iters) && tree_to_shwi ((L)->num_iters) > 0)
    1138                 :             : /* True if L has a non-NULL orig_loop_info, i.e. L is an epilogue of an already vectorized loop.  */
    1139                 :             : #define LOOP_VINFO_EPILOGUE_P(L) \
    1140                 :             :   (LOOP_VINFO_ORIG_LOOP_INFO (L) != NULL)
    1141                 :             : /* The max_vectorization_factor of L's orig_loop_info; dereferences it, so orig_loop_info must be non-NULL.  */
    1142                 :             : #define LOOP_VINFO_ORIG_MAX_VECT_FACTOR(L) \
    1143                 :             :   (LOOP_VINFO_MAX_VECT_FACTOR (LOOP_VINFO_ORIG_LOOP_INFO (L)))
    1144                 :             : 
    1145                 :             : /* Wrapper for loop_vec_info that tracks success/failure: a non-NULL value
    1146                 :             :    signifies success and a NULL value signifies failure.  On failure it
    1147                 :             :    supports propagating an opt_problem * describing the problem back up
    1148                 :             :    the call stack.  */
    1149                 :             : typedef opt_pointer_wrapper <loop_vec_info> opt_loop_vec_info;
    1150                 :             : /* Return the aux pointer of LOOP cast to loop_vec_info.  */
    1151                 :             : inline loop_vec_info
    1152                 :      490129 : loop_vec_info_for_loop (class loop *loop)
    1153                 :             : {
    1154                 :      490129 :   return (loop_vec_info) loop->aux;
    1155                 :             : }
    1156                 :             : /* Bundles an slp_instance_kind with its stmts, roots and remain vectors; the constructor defaults remain to vNULL.  */
    1157                 :             : struct slp_root
    1158                 :             : {
    1159                 :     1124960 :   slp_root (slp_instance_kind kind_, vec<stmt_vec_info> stmts_,
    1160                 :        7666 :             vec<stmt_vec_info> roots_, vec<tree> remain_ = vNULL)
    1161                 :     1124960 :     : kind(kind_), stmts(stmts_), roots(roots_), remain(remain_) {}
    1162                 :             :   slp_instance_kind kind;
    1163                 :             :   vec<stmt_vec_info> stmts;
    1164                 :             :   vec<stmt_vec_info> roots;
    1165                 :             :   vec<tree> remain;
    1166                 :             : };
    1167                 :             : /* vec_info subclass constructed from a vector of basic blocks; additionally holds a vec of slp_root.  */
    1168                 :             : typedef class _bb_vec_info : public vec_info
    1169                 :             : {
    1170                 :             : public:
    1171                 :             :   _bb_vec_info (vec<basic_block> bbs, vec_info_shared *);
    1172                 :             :   ~_bb_vec_info ();
    1173                 :             : 
    1174                 :             :   vec<slp_root> roots;
    1175                 :             : } *bb_vec_info;
    1176                 :             : /* Access macros for bb_vec_info B; each expands to a member access on B (some via B->shared).  */
    1177                 :             : #define BB_VINFO_BBS(B)              (B)->bbs
    1178                 :             : #define BB_VINFO_NBBS(B)             (B)->nbbs
    1179                 :             : #define BB_VINFO_GROUPED_STORES(B)   (B)->grouped_stores
    1180                 :             : #define BB_VINFO_SLP_INSTANCES(B)    (B)->slp_instances
    1181                 :             : #define BB_VINFO_DATAREFS(B)         (B)->shared->datarefs
    1182                 :             : #define BB_VINFO_DDRS(B)             (B)->shared->ddrs
    1183                 :             : 
    1184                 :             : /*-----------------------------------------------------------------*/
    1185                 :             : /* Info on vectorized defs.                                        */
    1186                 :             : /*-----------------------------------------------------------------*/
    1187                 :             : enum stmt_vec_info_type {
    1188                 :             :   undef_vec_info_type = 0,  /* Zero, so a zero-initialized field reads as "undefined".  */
    1189                 :             :   load_vec_info_type,
    1190                 :             :   store_vec_info_type,
    1191                 :             :   shift_vec_info_type,
    1192                 :             :   op_vec_info_type,
    1193                 :             :   call_vec_info_type,
    1194                 :             :   call_simd_clone_vec_info_type,
    1195                 :             :   assignment_vec_info_type,
    1196                 :             :   condition_vec_info_type,
    1197                 :             :   comparison_vec_info_type,
    1198                 :             :   reduc_vec_info_type,
    1199                 :             :   induc_vec_info_type,
    1200                 :             :   type_promotion_vec_info_type,
    1201                 :             :   type_demotion_vec_info_type,
    1202                 :             :   type_conversion_vec_info_type,
    1203                 :             :   cycle_phi_info_type,
    1204                 :             :   lc_phi_info_type,
    1205                 :             :   phi_info_type,
    1206                 :             :   recurr_info_type,
    1207                 :             :   loop_exit_ctrl_vec_info_type
    1208                 :             : };
    1209                 :             : 
    1210                 :             : /* Indicates whether/how a variable is used in the scope of loop/basic
    1211                 :             :    block.  */
    1212                 :             : enum vect_relevant {
    1213                 :             :   vect_unused_in_scope = 0,  /* Not used in the scope; this is the zero value.  */
    1214                 :             : 
    1215                 :             :   /* The def is only used outside the loop.  */
    1216                 :             :   vect_used_only_live,
    1217                 :             :   /* The def is in the inner loop, and the use is in the outer loop, and the
    1218                 :             :      use is a reduction stmt.  */
    1219                 :             :   vect_used_in_outer_by_reduction,
    1220                 :             :   /* The def is in the inner loop, and the use is in the outer loop (and is
    1221                 :             :      not part of reduction).  */
    1222                 :             :   vect_used_in_outer,
    1223                 :             : 
    1224                 :             :   /* Defs that feed computations that end up (only) in a reduction.  These
    1225                 :             :      defs may be used by non-reduction stmts, but eventually, any
    1226                 :             :      computations/values that are affected by these defs are used to compute
    1227                 :             :      a reduction (i.e. don't get stored to memory, for example).  We use this
    1228                 :             :      to identify computations that we can change the order in which they are
    1229                 :             :      computed.  */
    1230                 :             :   vect_used_by_reduction,
    1231                 :             :   /* NOTE(review): presumably the def is used within the loop/basic block in the ordinary way; inferred from the name -- confirm.  */
    1232                 :             :   vect_used_in_scope
    1233                 :             : };
    1234                 :             : 
    1235                 :             : /* The type of vectorization that can be applied to the stmt: regular loop-based
    1236                 :             :    vectorization; pure SLP - the stmt is a part of SLP instances and does not
    1237                 :             :    have uses outside SLP instances; or hybrid SLP and loop-based - the stmt is
    1238                 :             :    a part of an SLP instance and also must be loop-based vectorized, since it
    1239                 :             :    has uses outside SLP sequences.
    1240                 :             : 
    1241                 :             :    In the loop context the meanings of pure and hybrid SLP are slightly
    1242                 :             :    different.  By saying that pure SLP is applied to the loop, we mean that we
    1243                 :             :    exploit only intra-iteration parallelism in the loop; i.e., the loop can be
    1244                 :             :    vectorized without doing any conceptual unrolling, because we don't pack
    1245                 :             :    together stmts from different iterations, only within a single iteration.
    1246                 :             :    Loop hybrid SLP means that we exploit both intra-iteration and
    1247                 :             :    inter-iteration parallelism (e.g., number of elements in the vector is 4
    1248                 :             :    and the slp-group-size is 2, in which case we don't have enough parallelism
    1249                 :             :    within an iteration, so we obtain the rest of the parallelism from subsequent
    1250                 :             :    iterations by unrolling the loop by 2).  */
    1251                 :             : enum slp_vect_type {
    1252                 :             :   loop_vect = 0,
    1253                 :             :   pure_slp,
    1254                 :             :   hybrid
    1255                 :             : };
    1256                 :             : 
    1257                 :             : /* Says whether a statement is a load, a store of a vectorized statement
    1258                 :             :    result, or a store of an invariant value.  */
    1259                 :             : enum vec_load_store_type {
    1260                 :             :   VLS_LOAD,		/* A load.  */
    1261                 :             :   VLS_STORE,		/* A store of a vectorized statement result.  */
    1262                 :             :   VLS_STORE_INVARIANT	/* A store of an invariant value.  */
    1263                 :             : };
    1264                 :             : /* Vectorizer-specific information about one data reference and its stmt.  */
    1265                 :             : class dr_vec_info {
    1266                 :             : public:
    1267                 :             :   /* The data reference itself.  */
    1268                 :             :   data_reference *dr;
    1269                 :             :   /* The statement that contains the data reference.  */
    1270                 :             :   stmt_vec_info stmt;
    1271                 :             :   /* The analysis group this DR belongs to when doing BB vectorization.
    1272                 :             :      DRs of the same group belong to the same conditional execution context.  */
    1273                 :             :   unsigned group;
    1274                 :             :   /* The misalignment in bytes of the reference, or -1 if not known.  */
    1275                 :             :   int misalignment;
    1276                 :             :   /* The byte alignment that we'd ideally like the reference to have,
    1277                 :             :      and the value that misalignment is measured against.  */
    1278                 :             :   poly_uint64 target_alignment;
    1279                 :             :   /* If BASE_MISALIGNED is true, the alignment of BASE_DECL needs to be increased.  */
    1280                 :             :   bool base_misaligned;
    1281                 :             :   tree base_decl;
    1282                 :             : 
    1283                 :             :   /* Stores current vectorized loop's offset.  To be added to the DR's
    1284                 :             :      offset to calculate current offset of data reference.  */
    1285                 :             :   tree offset;
    1286                 :             : };
    1287                 :             : 
    1288                 :             : typedef struct data_reference *dr_p;	/* Pointer to a data reference.  */
    1289                 :             : /* Vectorizer information about a single stmt (see the STMT_VINFO_* accessors).  */
    1290                 :             : class _stmt_vec_info {
    1291                 :             : public:
    1292                 :             : 
    1293                 :             :   enum stmt_vec_info_type type;
    1294                 :             : 
    1295                 :             :   /* Indicates whether this stmt is part of a computation whose result is
    1296                 :             :      used outside the loop.  */
    1297                 :             :   bool live;
    1298                 :             : 
    1299                 :             :   /* Stmt is part of some pattern (computation idiom).  */
    1300                 :             :   bool in_pattern_p;
    1301                 :             : 
    1302                 :             :   /* True if the statement was created during pattern recognition as
    1303                 :             :      part of the replacement for RELATED_STMT.  This implies that the
    1304                 :             :      statement isn't part of any basic block, although for convenience
    1305                 :             :      its gimple_bb is the same as for RELATED_STMT.  */
    1306                 :             :   bool pattern_stmt_p;
    1307                 :             : 
    1308                 :             :   /* Is this statement vectorizable or should it be skipped in (partial)
    1309                 :             :      vectorization.  */
    1310                 :             :   bool vectorizable;
    1311                 :             : 
    1312                 :             :   /* The stmt to which this info struct refers.  */
    1313                 :             :   gimple *stmt;
    1314                 :             : 
    1315                 :             :   /* The vector type to be used for the LHS of this statement.  */
    1316                 :             :   tree vectype;
    1317                 :             : 
    1318                 :             :   /* The vectorized stmts.  */
    1319                 :             :   vec<gimple *> vec_stmts;
    1320                 :             : 
    1321                 :             :   /* The following is relevant only for stmts that contain a non-scalar
    1322                 :             :      data-ref (array/pointer/struct access).  A GIMPLE stmt is expected to have
    1323                 :             :      at most one such data-ref.  */
    1324                 :             : 
    1325                 :             :   dr_vec_info dr_aux;
    1326                 :             : 
    1327                 :             :   /* Information about the data-ref relative to this loop
    1328                 :             :      nest (the loop that is being considered for vectorization).  */
    1329                 :             :   innermost_loop_behavior dr_wrt_vec_loop;
    1330                 :             : 
    1331                 :             :   /* For loop PHI nodes, the base and evolution part of it.  This makes sure
    1332                 :             :      this information is still available in vect_update_ivs_after_vectorizer
    1333                 :             :      where we may not be able to re-analyze the PHI nodes evolution as
    1334                 :             :      peeling for the prologue loop can make it unanalyzable.  The evolution
    1335                 :             :      part is still correct after peeling, but the base may have changed from
    1336                 :             :      the version here.  */
    1337                 :             :   tree loop_phi_evolution_base_unchanged;
    1338                 :             :   tree loop_phi_evolution_part;
    1339                 :             :   enum vect_induction_op_type loop_phi_evolution_type;
    1340                 :             : 
    1341                 :             :   /* Used for various bookkeeping purposes, generally holding a pointer to
    1342                 :             :      some other stmt S that is in some way "related" to this stmt.
    1343                 :             :      Current use of this field is:
    1344                 :             :         If this stmt is part of a pattern (i.e. the field 'in_pattern_p' is
    1345                 :             :         true): S is the "pattern stmt" that represents (and replaces) the
    1346                 :             :         sequence of stmts that constitutes the pattern.  Similarly, the
    1347                 :             :         related_stmt of the "pattern stmt" points back to this stmt (which is
    1348                 :             :         the last stmt in the original sequence of stmts that constitutes the
    1349                 :             :         pattern).  */
    1350                 :             :   stmt_vec_info related_stmt;
    1351                 :             : 
    1352                 :             :   /* Used to keep a sequence of def stmts of a pattern stmt if such exists.
    1353                 :             :      The sequence is attached to the original statement rather than the
    1354                 :             :      pattern statement.  */
    1355                 :             :   gimple_seq pattern_def_seq;
    1356                 :             : 
    1357                 :             :   /* Selected SIMD clone's function info.  First vector element
    1358                 :             :      is SIMD clone's function decl, followed by a pair of trees (base + step)
    1359                 :             :      for linear arguments (pair of NULLs for other arguments).  */
    1360                 :             :   vec<tree> simd_clone_info;
    1361                 :             : 
    1362                 :             :   /* Classify the def of this stmt.  */
    1363                 :             :   enum vect_def_type def_type;
    1364                 :             : 
    1365                 :             :   /* Whether the stmt is SLPed, loop-based vectorized, or both.  */
    1366                 :             :   enum slp_vect_type slp_type;
    1367                 :             : 
    1368                 :             :   /* Interleaving and reduction chains info.  */
    1369                 :             :   /* First element in the group.  */
    1370                 :             :   stmt_vec_info first_element;
    1371                 :             :   /* Pointer to the next element in the group.  */
    1372                 :             :   stmt_vec_info next_element;
    1373                 :             :   /* The size of the group.  */
    1374                 :             :   unsigned int size;
    1375                 :             :   /* For stores, number of stores from this group seen.  We vectorize the last
    1376                 :             :      one.  */
    1377                 :             :   unsigned int store_count;
    1378                 :             :   /* For loads only, the gap from the previous load.  For consecutive loads, GAP
    1379                 :             :      is 1.  */
    1380                 :             :   unsigned int gap;
    1381                 :             : 
    1382                 :             :   /* The minimum negative dependence distance this stmt participates in
    1383                 :             :      or zero if none.  */
    1384                 :             :   unsigned int min_neg_dist;
    1385                 :             : 
    1386                 :             :   /* Not all stmts in the loop need to be vectorized, e.g., the increment
    1387                 :             :      of the loop induction variable and computation of array indexes.  RELEVANT
    1388                 :             :      indicates whether the stmt needs to be vectorized.  */
    1389                 :             :   enum vect_relevant relevant;
    1390                 :             : 
    1391                 :             :   /* For loads if this is a gather, for stores if this is a scatter.  */
    1392                 :             :   bool gather_scatter_p;
    1393                 :             : 
    1394                 :             :   /* True if this is an access with loop-invariant stride.  */
    1395                 :             :   bool strided_p;
    1396                 :             : 
    1397                 :             :   /* For both loads and stores.  */
    1398                 :             :   unsigned simd_lane_access_p : 3;
    1399                 :             : 
    1400                 :             :   /* Classifies how the load or store is going to be implemented
    1401                 :             :      for loop vectorization.  */
    1402                 :             :   vect_memory_access_type memory_access_type;
    1403                 :             : 
    1404                 :             :   /* For INTEGER_INDUC_COND_REDUCTION, the initial value to be used.  */
    1405                 :             :   tree induc_cond_initial_val;
    1406                 :             : 
    1407                 :             :   /* If not NULL the value to be added to compute final reduction value.  */
    1408                 :             :   tree reduc_epilogue_adjustment;
    1409                 :             : 
    1410                 :             :   /* On a reduction PHI the reduction type as detected by
    1411                 :             :      vect_is_simple_reduction and vectorizable_reduction.  */
    1412                 :             :   enum vect_reduction_type reduc_type;
    1413                 :             : 
    1414                 :             :   /* The original reduction code, to be used in the epilogue.  */
    1415                 :             :   code_helper reduc_code;
    1416                 :             :   /* An internal function we should use in the epilogue.  */
    1417                 :             :   internal_fn reduc_fn;
    1418                 :             : 
    1419                 :             :   /* On a stmt participating in the reduction the index of the operand
    1420                 :             :      on the reduction SSA cycle.  */
    1421                 :             :   int reduc_idx;
    1422                 :             : 
    1423                 :             :   /* On a reduction PHI the def returned by vect_force_simple_reduction.
    1424                 :             :      On the def returned by vect_force_simple_reduction the
    1425                 :             :      corresponding PHI.  */
    1426                 :             :   stmt_vec_info reduc_def;
    1427                 :             : 
    1428                 :             :   /* The vector input type relevant for reduction vectorization.  */
    1429                 :             :   tree reduc_vectype_in;
    1430                 :             : 
    1431                 :             :   /* The vector type for performing the actual reduction.  */
    1432                 :             :   tree reduc_vectype;
    1433                 :             : 
    1434                 :             :   /* For loop reduction with multiple vectorized results (ncopies > 1), a
    1435                 :             :      lane-reducing operation participating in it may not use all of those
    1436                 :             :      results, this field specifies result index starting from which any
    1437                 :             :      following lane-reducing operation would be assigned to.  */
    1438                 :             :   unsigned int reduc_result_pos;
    1439                 :             : 
    1440                 :             :   /* If IS_REDUC_INFO is true and if the vector code is performing
    1441                 :             :      N scalar reductions in parallel, this variable gives the initial
    1442                 :             :      scalar values of those N reductions.  */
    1443                 :             :   vec<tree> reduc_initial_values;
    1444                 :             : 
    1445                 :             :   /* If IS_REDUC_INFO is true and if the vector code is performing
    1446                 :             :      N scalar reductions in parallel, this variable gives the vectorized code's
    1447                 :             :      final (scalar) result for each of those N reductions.  In other words,
    1448                 :             :      REDUC_SCALAR_RESULTS[I] replaces the original scalar code's loop-closed
    1449                 :             :      SSA PHI for reduction number I.  */
    1450                 :             :   vec<tree> reduc_scalar_results;
    1451                 :             : 
    1452                 :             :   /* Only meaningful if IS_REDUC_INFO.  If non-null, the reduction is
    1453                 :             :      being performed by an epilogue loop and we have decided to reuse
    1454                 :             :      this accumulator from the main loop.  */
    1455                 :             :   vect_reusable_accumulator *reused_accumulator;
    1456                 :             : 
    1457                 :             :   /* Whether we force a single cycle PHI during reduction vectorization.  */
    1458                 :             :   bool force_single_cycle;
    1459                 :             : 
    1460                 :             :   /* Whether reduction meta is recorded on this stmt.  */
    1461                 :             :   bool is_reduc_info;
    1462                 :             : 
    1463                 :             :   /* If nonzero, the lhs of the statement could be truncated to this
    1464                 :             :      many bits without affecting any users of the result.  */
    1465                 :             :   unsigned int min_output_precision;
    1466                 :             : 
    1467                 :             :   /* If nonzero, all non-boolean input operands have the same precision,
    1468                 :             :      and they could each be truncated to this many bits without changing
    1469                 :             :      the result.  */
    1470                 :             :   unsigned int min_input_precision;
    1471                 :             : 
    1472                 :             :   /* If OPERATION_PRECISION is nonzero, the statement could be performed on
    1473                 :             :      an integer with the sign and number of bits given by OPERATION_SIGN
    1474                 :             :      and OPERATION_PRECISION without changing the result.  */
    1475                 :             :   unsigned int operation_precision;
    1476                 :             :   signop operation_sign;
    1477                 :             : 
    1478                 :             :   /* If the statement produces a boolean result, this value describes
    1479                 :             :      how we should choose the associated vector type.  The possible
    1480                 :             :      values are:
    1481                 :             : 
    1482                 :             :      - an integer precision N if we should use the vector mask type
    1483                 :             :        associated with N-bit integers.  This is only used if all relevant
    1484                 :             :        input booleans also want the vector mask type for N-bit integers,
    1485                 :             :        or if we can convert them into that form by pattern-matching.
    1486                 :             : 
    1487                 :             :      - ~0U if we considered choosing a vector mask type but decided
    1488                 :             :        to treat the boolean as a normal integer type instead.
    1489                 :             : 
    1490                 :             :      - 0 otherwise.  This means either that the operation isn't one that
    1491                 :             :        could have a vector mask type (and so should have a normal vector
    1492                 :             :        type instead) or that we simply haven't made a choice either way.  */
    1493                 :             :   unsigned int mask_precision;
    1494                 :             : 
    1495                 :             :   /* True if this is only suitable for SLP vectorization.  */
    1496                 :             :   bool slp_vect_only_p;
    1497                 :             : 
    1498                 :             :   /* True if this is a pattern that can only be handled by SLP
    1499                 :             :      vectorization.  */
    1500                 :             :   bool slp_vect_pattern_only_p;
    1501                 :             : };
    1502                 :             : 
    1503                 :             : /* Information about a gather/scatter call: BASE plus OFFSET elements times SCALE.  */
    1504                 :             : struct gather_scatter_info {
    1505                 :             :   /* The internal function to use for the gather/scatter operation,
    1506                 :             :      or IFN_LAST if a built-in function should be used instead.  */
    1507                 :             :   internal_fn ifn;
    1508                 :             : 
    1509                 :             :   /* The FUNCTION_DECL for the built-in gather/scatter function,
    1510                 :             :      or null if an internal function should be used instead.  */
    1511                 :             :   tree decl;
    1512                 :             : 
    1513                 :             :   /* The loop-invariant base value.  */
    1514                 :             :   tree base;
    1515                 :             : 
    1516                 :             :   /* The original scalar offset, which is a non-loop-invariant SSA_NAME.  */
    1517                 :             :   tree offset;
    1518                 :             : 
    1519                 :             :   /* Each offset element should be multiplied by this amount before
    1520                 :             :      being added to the base.  */
    1521                 :             :   int scale;
    1522                 :             : 
    1523                 :             :   /* The definition type for the vectorized offset.  */
    1524                 :             :   enum vect_def_type offset_dt;
    1525                 :             : 
    1526                 :             :   /* The type of the vectorized offset.  */
    1527                 :             :   tree offset_vectype;
    1528                 :             : 
    1529                 :             :   /* The type of the scalar elements after loading or before storing.  */
    1530                 :             :   tree element_type;
    1531                 :             : 
    1532                 :             :   /* The type of the scalar elements being loaded or stored.  */
    1533                 :             :   tree memory_type;
    1534                 :             : };
    1535                 :             : 
    1536                 :             : /* Access Functions.  STMT_VINFO_DATA_REF yields an rvalue (note the + 0), so it cannot be assigned to.  */
    1537                 :             : #define STMT_VINFO_TYPE(S)                 (S)->type
    1538                 :             : #define STMT_VINFO_STMT(S)                 (S)->stmt
    1539                 :             : #define STMT_VINFO_RELEVANT(S)             (S)->relevant
    1540                 :             : #define STMT_VINFO_LIVE_P(S)               (S)->live
    1541                 :             : #define STMT_VINFO_VECTYPE(S)              (S)->vectype
    1542                 :             : #define STMT_VINFO_VEC_STMTS(S)            (S)->vec_stmts
    1543                 :             : #define STMT_VINFO_VECTORIZABLE(S)         (S)->vectorizable
    1544                 :             : #define STMT_VINFO_DATA_REF(S)             ((S)->dr_aux.dr + 0)
    1545                 :             : #define STMT_VINFO_GATHER_SCATTER_P(S)     (S)->gather_scatter_p
    1546                 :             : #define STMT_VINFO_STRIDED_P(S)            (S)->strided_p
    1547                 :             : #define STMT_VINFO_MEMORY_ACCESS_TYPE(S)   (S)->memory_access_type
    1548                 :             : #define STMT_VINFO_SIMD_LANE_ACCESS_P(S)   (S)->simd_lane_access_p
    1549                 :             : #define STMT_VINFO_VEC_INDUC_COND_INITIAL_VAL(S) (S)->induc_cond_initial_val
    1550                 :             : #define STMT_VINFO_REDUC_EPILOGUE_ADJUSTMENT(S) (S)->reduc_epilogue_adjustment
    1551                 :             : #define STMT_VINFO_REDUC_IDX(S)            (S)->reduc_idx
    1552                 :             : #define STMT_VINFO_FORCE_SINGLE_CYCLE(S)   (S)->force_single_cycle
    1553                 :             : 
    1554                 :             : #define STMT_VINFO_DR_WRT_VEC_LOOP(S)      (S)->dr_wrt_vec_loop
    1555                 :             : #define STMT_VINFO_DR_BASE_ADDRESS(S)      (S)->dr_wrt_vec_loop.base_address
    1556                 :             : #define STMT_VINFO_DR_INIT(S)              (S)->dr_wrt_vec_loop.init
    1557                 :             : #define STMT_VINFO_DR_OFFSET(S)            (S)->dr_wrt_vec_loop.offset
    1558                 :             : #define STMT_VINFO_DR_STEP(S)              (S)->dr_wrt_vec_loop.step
    1559                 :             : #define STMT_VINFO_DR_BASE_ALIGNMENT(S)    (S)->dr_wrt_vec_loop.base_alignment
    1560                 :             : #define STMT_VINFO_DR_BASE_MISALIGNMENT(S) \
    1561                 :             :   (S)->dr_wrt_vec_loop.base_misalignment
    1562                 :             : #define STMT_VINFO_DR_OFFSET_ALIGNMENT(S) \
    1563                 :             :   (S)->dr_wrt_vec_loop.offset_alignment
    1564                 :             : #define STMT_VINFO_DR_STEP_ALIGNMENT(S) \
    1565                 :             :   (S)->dr_wrt_vec_loop.step_alignment
    1566                 :             : /* Address of S's dr_aux; a gcc_checking_assert verifies dr_aux.stmt is S itself.  */
    1567                 :             : #define STMT_VINFO_DR_INFO(S) \
    1568                 :             :   (gcc_checking_assert ((S)->dr_aux.stmt == (S)), &(S)->dr_aux)
    1569                 :             : 
    1570                 :             : #define STMT_VINFO_IN_PATTERN_P(S)         (S)->in_pattern_p
    1571                 :             : #define STMT_VINFO_RELATED_STMT(S)         (S)->related_stmt
    1572                 :             : #define STMT_VINFO_PATTERN_DEF_SEQ(S)      (S)->pattern_def_seq
    1573                 :             : #define STMT_VINFO_SIMD_CLONE_INFO(S)      (S)->simd_clone_info
    1574                 :             : #define STMT_VINFO_DEF_TYPE(S)             (S)->def_type
    1575                 :             : #define STMT_VINFO_GROUPED_ACCESS(S) \
    1576                 :             :   ((S)->dr_aux.dr && DR_GROUP_FIRST_ELEMENT(S))
    1577                 :             : #define STMT_VINFO_LOOP_PHI_EVOLUTION_BASE_UNCHANGED(S) (S)->loop_phi_evolution_base_unchanged
    1578                 :             : #define STMT_VINFO_LOOP_PHI_EVOLUTION_PART(S) (S)->loop_phi_evolution_part
    1579                 :             : #define STMT_VINFO_LOOP_PHI_EVOLUTION_TYPE(S) (S)->loop_phi_evolution_type
    1580                 :             : #define STMT_VINFO_MIN_NEG_DIST(S)      (S)->min_neg_dist
    1581                 :             : #define STMT_VINFO_REDUC_TYPE(S)        (S)->reduc_type
    1582                 :             : #define STMT_VINFO_REDUC_CODE(S)        (S)->reduc_code
    1583                 :             : #define STMT_VINFO_REDUC_FN(S)          (S)->reduc_fn
    1584                 :             : #define STMT_VINFO_REDUC_DEF(S)         (S)->reduc_def
    1585                 :             : #define STMT_VINFO_REDUC_VECTYPE(S)     (S)->reduc_vectype
    1586                 :             : #define STMT_VINFO_REDUC_VECTYPE_IN(S)  (S)->reduc_vectype_in
    1587                 :             : #define STMT_VINFO_SLP_VECT_ONLY(S)     (S)->slp_vect_only_p
    1588                 :             : #define STMT_VINFO_SLP_VECT_ONLY_PATTERN(S) (S)->slp_vect_pattern_only_p
    1589                 :             : /* Group fields viewed as a data-ref group; each asserts that S has a data reference.  */
    1590                 :             : #define DR_GROUP_FIRST_ELEMENT(S) \
    1591                 :             :   (gcc_checking_assert ((S)->dr_aux.dr), (S)->first_element)
    1592                 :             : #define DR_GROUP_NEXT_ELEMENT(S) \
    1593                 :             :   (gcc_checking_assert ((S)->dr_aux.dr), (S)->next_element)
    1594                 :             : #define DR_GROUP_SIZE(S) \
    1595                 :             :   (gcc_checking_assert ((S)->dr_aux.dr), (S)->size)
    1596                 :             : #define DR_GROUP_STORE_COUNT(S) \
    1597                 :             :   (gcc_checking_assert ((S)->dr_aux.dr), (S)->store_count)
    1598                 :             : #define DR_GROUP_GAP(S) \
    1599                 :             :   (gcc_checking_assert ((S)->dr_aux.dr), (S)->gap)
    1600                 :             : /* The same group fields viewed as a reduction group; each asserts that S has no data reference.  */
    1601                 :             : #define REDUC_GROUP_FIRST_ELEMENT(S) \
    1602                 :             :   (gcc_checking_assert (!(S)->dr_aux.dr), (S)->first_element)
    1603                 :             : #define REDUC_GROUP_NEXT_ELEMENT(S) \
    1604                 :             :   (gcc_checking_assert (!(S)->dr_aux.dr), (S)->next_element)
    1605                 :             : #define REDUC_GROUP_SIZE(S) \
    1606                 :             :   (gcc_checking_assert (!(S)->dr_aux.dr), (S)->size)
    1607                 :             : 
    1608                 :             : #define STMT_VINFO_RELEVANT_P(S)          ((S)->relevant != vect_unused_in_scope)
    1609                 :             : 
    1610                 :             : #define HYBRID_SLP_STMT(S)                ((S)->slp_type == hybrid)
    1611                 :             : #define PURE_SLP_STMT(S)                  ((S)->slp_type == pure_slp)
    1612                 :             : #define STMT_SLP_TYPE(S)                   (S)->slp_type
    1613                 :             : 
    /* Contains the scalar or vector costs for a vec_info.

       One cost is kept for each of the three regions indexed by
       vect_cost_model_location (see m_costs).  The read-back accessors
       declared below are defined inline after the class; they check
       m_finished, i.e. they expect finish_cost to have been called.  */
    class vector_costs
    {
    public:
      /* Create costs for the given vec_info.  The bool is true if the
         costs are for scalar code, false if they are for vector code.  */
      vector_costs (vec_info *, bool);
      /* Virtual so that objects can be destroyed through a pointer to
         this base class.  */
      virtual ~vector_costs () {}

      /* Update the costs in response to adding COUNT copies of a statement.

         - WHERE specifies whether the cost occurs in the loop prologue,
           the loop body, or the loop epilogue.
         - KIND is the kind of statement, which is always meaningful.
         - STMT_INFO or NODE, if nonnull, describe the statement that will be
           vectorized.
         - VECTYPE, if nonnull, is the vector type that the vectorized
           statement will operate on.  Note that this should be used in
           preference to STMT_VINFO_VECTYPE (STMT_INFO) since the latter
           is not correct for SLP.
         - for unaligned_load and unaligned_store statements, MISALIGN is
           the byte misalignment of the load or store relative to the target's
           preferred alignment for VECTYPE, or DR_MISALIGNMENT_UNKNOWN
           if the misalignment is not known.

         Return the calculated cost as well as recording it.  The return
         value is used for dumping purposes.  */
      virtual unsigned int add_stmt_cost (int count, vect_cost_for_stmt kind,
                                          stmt_vec_info stmt_info,
                                          slp_tree node,
                                          tree vectype, int misalign,
                                          vect_cost_model_location where);

      /* Finish calculating the cost of the code.  The results can be
         read back using the functions below.

         If the costs describe vector code, SCALAR_COSTS gives the costs
         of the corresponding scalar code, otherwise it is null.  */
      virtual void finish_cost (const vector_costs *scalar_costs);

      /* The costs in THIS and OTHER both describe ways of vectorizing
         a main loop.  Return true if the costs described by THIS are
         cheaper than the costs described by OTHER.  Return false if any
         of the following are true:

         - THIS and OTHER are of equal cost
         - OTHER is better than THIS
         - we can't be sure about the relative costs of THIS and OTHER.  */
      virtual bool better_main_loop_than_p (const vector_costs *other) const;

      /* Likewise, but the costs in THIS and OTHER both describe ways of
         vectorizing an epilogue loop of MAIN_LOOP.  */
      virtual bool better_epilogue_loop_than_p (const vector_costs *other,
                                                loop_vec_info main_loop) const;

      /* Read back the finished costs, in abstract units.  outside_cost is
         the sum of the prologue and epilogue costs; total_cost adds the
         body cost to that.  */
      unsigned int prologue_cost () const;
      unsigned int body_cost () const;
      unsigned int epilogue_cost () const;
      unsigned int outside_cost () const;
      unsigned int total_cost () const;
      /* Read back the suggestions recorded in m_suggested_unroll_factor
         and m_suggested_epilogue_mode.  */
      unsigned int suggested_unroll_factor () const;
      machine_mode suggested_epilogue_mode () const;

    protected:
      /* Helpers available to this class and to classes derived from it.
         NOTE(review): their definitions are not part of this header
         section; consult them before relying on exact semantics.  */
      unsigned int record_stmt_cost (stmt_vec_info, vect_cost_model_location,
                                     unsigned int);
      unsigned int adjust_cost_for_freq (stmt_vec_info, vect_cost_model_location,
                                         unsigned int);
      int compare_inside_loop_cost (const vector_costs *) const;
      int compare_outside_loop_cost (const vector_costs *) const;

      /* The region of code that we're considering vectorizing.  */
      vec_info *m_vinfo;

      /* True if we're costing the scalar code, false if we're costing
         the vector code.  */
      bool m_costing_for_scalar;

      /* The costs of the three regions, indexed by vect_cost_model_location.  */
      unsigned int m_costs[3];

      /* The suggested unrolling factor determined at finish_cost.  */
      unsigned int m_suggested_unroll_factor;

      /* The suggested mode to be used for a vectorized epilogue or VOIDmode,
         determined at finish_cost.  */
      machine_mode m_suggested_epilogue_mode;

      /* True if finish_cost has been called.  */
      bool m_finished;
    };
    1703                 :             : 
    1704                 :             : /* Create costs for VINFO.  COSTING_FOR_SCALAR is true if the costs
    1705                 :             :    are for scalar code, false if they are for vector code.  */
    1706                 :             : 
    1707                 :             : inline
    1708                 :     1705645 : vector_costs::vector_costs (vec_info *vinfo, bool costing_for_scalar)
    1709                 :     1705645 :   : m_vinfo (vinfo),
    1710                 :     1705645 :     m_costing_for_scalar (costing_for_scalar),
    1711                 :     6822580 :     m_costs (),
    1712                 :     1705645 :     m_suggested_unroll_factor(1),
    1713                 :     1705645 :     m_suggested_epilogue_mode(VOIDmode),
    1714                 :     1705645 :     m_finished (false)
    1715                 :             : {
    1716                 :             : }
    1717                 :             : 
    1718                 :             : /* Return the cost of the prologue code (in abstract units).  */
    1719                 :             : 
    1720                 :             : inline unsigned int
    1721                 :      796631 : vector_costs::prologue_cost () const
    1722                 :             : {
    1723                 :      796631 :   gcc_checking_assert (m_finished);
    1724                 :      796631 :   return m_costs[vect_prologue];
    1725                 :             : }
    1726                 :             : 
    1727                 :             : /* Return the cost of the body code (in abstract units).  */
    1728                 :             : 
    1729                 :             : inline unsigned int
    1730                 :     1444422 : vector_costs::body_cost () const
    1731                 :             : {
    1732                 :     1444422 :   gcc_checking_assert (m_finished);
    1733                 :     1444422 :   return m_costs[vect_body];
    1734                 :             : }
    1735                 :             : 
    1736                 :             : /* Return the cost of the epilogue code (in abstract units).  */
    1737                 :             : 
    1738                 :             : inline unsigned int
    1739                 :      796631 : vector_costs::epilogue_cost () const
    1740                 :             : {
    1741                 :      796631 :   gcc_checking_assert (m_finished);
    1742                 :      796631 :   return m_costs[vect_epilogue];
    1743                 :             : }
    1744                 :             : 
    1745                 :             : /* Return the cost of the prologue and epilogue code (in abstract units).  */
    1746                 :             : 
    1747                 :             : inline unsigned int
    1748                 :       74420 : vector_costs::outside_cost () const
    1749                 :             : {
    1750                 :       74420 :   return prologue_cost () + epilogue_cost ();
    1751                 :             : }
    1752                 :             : 
    1753                 :             : /* Return the cost of the prologue, body and epilogue code
    1754                 :             :    (in abstract units).  */
    1755                 :             : 
    1756                 :             : inline unsigned int
    1757                 :       74420 : vector_costs::total_cost () const
    1758                 :             : {
    1759                 :       74420 :   return body_cost () + outside_cost ();
    1760                 :             : }
    1761                 :             : 
    1762                 :             : /* Return the suggested unroll factor.  */
    1763                 :             : 
    1764                 :             : inline unsigned int
    1765                 :       74420 : vector_costs::suggested_unroll_factor () const
    1766                 :             : {
    1767                 :       74420 :   gcc_checking_assert (m_finished);
    1768                 :       74420 :   return m_suggested_unroll_factor;
    1769                 :             : }
    1770                 :             : 
    1771                 :             : /* Return the suggested epilogue mode.  */
    1772                 :             : 
    1773                 :             : inline machine_mode
    1774                 :       11172 : vector_costs::suggested_epilogue_mode () const
    1775                 :             : {
    1776                 :       11172 :   gcc_checking_assert (m_finished);
    1777                 :       11172 :   return m_suggested_epilogue_mode;
    1778                 :             : }
    1779                 :             : 
    /* NOTE(review): presumably an upper bound used by the cost code;
       the users are not visible in this part of the header -- confirm.  */
    #define VECT_MAX_COST 1000

    /* The maximum number of intermediate steps required in multi-step type
       conversion.  */
    #define MAX_INTERM_CVT_STEPS         3

    /* Expands to INT_MAX.  NOTE(review): the name suggests there is
       effectively no cap on the vectorization factor -- confirm at the
       points of use.  */
    #define MAX_VECTORIZATION_FACTOR INT_MAX
    1787                 :             : 
    /* Nonzero if TYPE represents a (scalar) boolean type or type
       in the middle-end compatible with it (unsigned precision 1 integral
       types).  Used to determine which types should be vectorized as
       VECTOR_BOOLEAN_TYPE_P.

       Concretely: TYPE is a BOOLEAN_TYPE, or it is an INTEGER_TYPE or
       ENUMERAL_TYPE that is unsigned and has TYPE_PRECISION 1.  TYPE is
       expanded several times, so it should be free of side effects.  */

    #define VECT_SCALAR_BOOLEAN_TYPE_P(TYPE) \
      (TREE_CODE (TYPE) == BOOLEAN_TYPE             \
       || ((TREE_CODE (TYPE) == INTEGER_TYPE        \
            || TREE_CODE (TYPE) == ENUMERAL_TYPE)   \
           && TYPE_PRECISION (TYPE) == 1            \
           && TYPE_UNSIGNED (TYPE)))
    1799                 :             : 
    1800                 :             : inline bool
    1801                 :     8270239 : nested_in_vect_loop_p (class loop *loop, stmt_vec_info stmt_info)
    1802                 :             : {
    1803                 :     8270239 :   return (loop->inner
    1804                 :     6756704 :           && (loop->inner == (gimple_bb (stmt_info->stmt))->loop_father));
    1805                 :             : }
    1806                 :             : 
    1807                 :             : /* PHI is either a scalar reduction phi or a scalar induction phi.
    1808                 :             :    Return the initial value of the variable on entry to the containing
    1809                 :             :    loop.  */
    1810                 :             : 
    1811                 :             : inline tree
    1812                 :       32101 : vect_phi_initial_value (gphi *phi)
    1813                 :             : {
    1814                 :       32101 :   basic_block bb = gimple_bb (phi);
    1815                 :       32101 :   edge pe = loop_preheader_edge (bb->loop_father);
    1816                 :       32101 :   gcc_assert (pe->dest == bb);
    1817                 :       32101 :   return PHI_ARG_DEF_FROM_EDGE (phi, pe);
    1818                 :             : }
    1819                 :             : 
    1820                 :             : /* Return true if STMT_INFO should produce a vector mask type rather than
    1821                 :             :    a normal nonmask type.  */
    1822                 :             : 
    1823                 :             : inline bool
    1824                 :     5284304 : vect_use_mask_type_p (stmt_vec_info stmt_info)
    1825                 :             : {
    1826                 :     5284304 :   return stmt_info->mask_precision && stmt_info->mask_precision != ~0U;
    1827                 :             : }
    1828                 :             : 
    1829                 :             : /* Return TRUE if a statement represented by STMT_INFO is a part of a
    1830                 :             :    pattern.  */
    1831                 :             : 
    1832                 :             : inline bool
    1833                 :   114311146 : is_pattern_stmt_p (stmt_vec_info stmt_info)
    1834                 :             : {
    1835                 :    75341163 :   return stmt_info->pattern_stmt_p;
    1836                 :             : }
    1837                 :             : 
    1838                 :             : /* If STMT_INFO is a pattern statement, return the statement that it
    1839                 :             :    replaces, otherwise return STMT_INFO itself.  */
    1840                 :             : 
    1841                 :             : inline stmt_vec_info
    1842                 :    43251327 : vect_orig_stmt (stmt_vec_info stmt_info)
    1843                 :             : {
    1844                 :    37326398 :   if (is_pattern_stmt_p (stmt_info))
    1845                 :     1906259 :     return STMT_VINFO_RELATED_STMT (stmt_info);
    1846                 :             :   return stmt_info;
    1847                 :             : }
    1848                 :             : 
    1849                 :             : /* Return the later statement between STMT1_INFO and STMT2_INFO.  */
    1850                 :             : 
    1851                 :             : inline stmt_vec_info
    1852                 :     5726086 : get_later_stmt (stmt_vec_info stmt1_info, stmt_vec_info stmt2_info)
    1853                 :             : {
    1854                 :     5726530 :   if (gimple_uid (vect_orig_stmt (stmt1_info)->stmt)
    1855                 :     5726086 :       > gimple_uid (vect_orig_stmt (stmt2_info)->stmt))
    1856                 :             :     return stmt1_info;
    1857                 :             :   else
    1858                 :     1131255 :     return stmt2_info;
    1859                 :             : }
    1860                 :             : 
    1861                 :             : /* If STMT_INFO has been replaced by a pattern statement, return the
    1862                 :             :    replacement statement, otherwise return STMT_INFO itself.  */
    1863                 :             : 
    1864                 :             : inline stmt_vec_info
    1865                 :    46908561 : vect_stmt_to_vectorize (stmt_vec_info stmt_info)
    1866                 :             : {
    1867                 :    46908560 :   if (STMT_VINFO_IN_PATTERN_P (stmt_info))
    1868                 :      832493 :     return STMT_VINFO_RELATED_STMT (stmt_info);
    1869                 :             :   return stmt_info;
    1870                 :             : }
    1871                 :             : 
    1872                 :             : /* Return true if BB is a loop header.  */
    1873                 :             : 
    1874                 :             : inline bool
    1875                 :     1284609 : is_loop_header_bb_p (basic_block bb)
    1876                 :             : {
    1877                 :     1284609 :   if (bb == (bb->loop_father)->header)
    1878                 :     1274349 :     return true;
    1879                 :             : 
    1880                 :             :   return false;
    1881                 :             : }
    1882                 :             : 
    /* Return 2 raised to the power X, computed by repeated doubling.
       The result is 1 when X is zero or negative.  There is no guard
       against overflow of int for large X.  */

    inline int
    vect_pow2 (int x)
    {
      int result = 1;

      for (int remaining = x; remaining > 0; remaining--)
        result *= 2;

      return result;
    }
    1895                 :             : 
    1896                 :             : /* Alias targetm.vectorize.builtin_vectorization_cost.  */
    1897                 :             : 
    1898                 :             : inline int
    1899                 :     8165960 : builtin_vectorization_cost (enum vect_cost_for_stmt type_of_cost,
    1900                 :             :                             tree vectype, int misalign)
    1901                 :             : {
    1902                 :     8165960 :   return targetm.vectorize.builtin_vectorization_cost (type_of_cost,
    1903                 :             :                                                        vectype, misalign);
    1904                 :             : }
    1905                 :             : 
    1906                 :             : /* Get cost by calling cost target builtin.  */
    1907                 :             : 
    1908                 :             : inline
    1909                 :           2 : int vect_get_stmt_cost (enum vect_cost_for_stmt type_of_cost)
    1910                 :             : {
    1911                 :       44322 :   return builtin_vectorization_cost (type_of_cost, NULL, 0);
    1912                 :             : }
    1913                 :             : 
    1914                 :             : /* Alias targetm.vectorize.init_cost.  */
    1915                 :             : 
    1916                 :             : inline vector_costs *
    1917                 :     1705645 : init_cost (vec_info *vinfo, bool costing_for_scalar)
    1918                 :             : {
    1919                 :     1705645 :   return targetm.vectorize.create_costs (vinfo, costing_for_scalar);
    1920                 :             : }
    1921                 :             : 
    1922                 :             : extern void dump_stmt_cost (FILE *, int, enum vect_cost_for_stmt,
    1923                 :             :                             stmt_vec_info, slp_tree, tree, int, unsigned,
    1924                 :             :                             enum vect_cost_model_location);
    1925                 :             : 
    1926                 :             : /* Dump and add costs.  */
    1927                 :             : 
    1928                 :             : inline unsigned
    1929                 :     6198433 : add_stmt_cost (vector_costs *costs, int count,
    1930                 :             :                enum vect_cost_for_stmt kind,
    1931                 :             :                stmt_vec_info stmt_info, slp_tree node,
    1932                 :             :                tree vectype, int misalign,
    1933                 :             :                enum vect_cost_model_location where)
    1934                 :             : {
    1935                 :     6198433 :   unsigned cost = costs->add_stmt_cost (count, kind, stmt_info, node, vectype,
    1936                 :             :                                         misalign, where);
    1937                 :     6198433 :   if (dump_file && (dump_flags & TDF_DETAILS))
    1938                 :      229019 :     dump_stmt_cost (dump_file, count, kind, stmt_info, node, vectype, misalign,
    1939                 :             :                     cost, where);
    1940                 :     6198433 :   return cost;
    1941                 :             : }
    1942                 :             : 
    1943                 :             : inline unsigned
    1944                 :       52403 : add_stmt_cost (vector_costs *costs, int count, enum vect_cost_for_stmt kind,
    1945                 :             :                enum vect_cost_model_location where)
    1946                 :             : {
    1947                 :       52403 :   gcc_assert (kind == cond_branch_taken || kind == cond_branch_not_taken
    1948                 :             :               || kind == scalar_stmt);
    1949                 :       52403 :   return add_stmt_cost (costs, count, kind, NULL, NULL, NULL_TREE, 0, where);
    1950                 :             : }
    1951                 :             : 
    1952                 :             : inline unsigned
    1953                 :     3804409 : add_stmt_cost (vector_costs *costs, stmt_info_for_cost *i)
    1954                 :             : {
    1955                 :     3804409 :   return add_stmt_cost (costs, i->count, i->kind, i->stmt_info, i->node,
    1956                 :     3804409 :                         i->vectype, i->misalign, i->where);
    1957                 :             : }
    1958                 :             : 
    1959                 :             : inline void
    1960                 :      458782 : add_stmt_costs (vector_costs *costs, stmt_vector_for_cost *cost_vec)
    1961                 :             : {
    1962                 :      458782 :   stmt_info_for_cost *cost;
    1963                 :      458782 :   unsigned i;
    1964                 :     2595289 :   FOR_EACH_VEC_ELT (*cost_vec, i, cost)
    1965                 :     2136507 :     add_stmt_cost (costs, cost->count, cost->kind, cost->stmt_info,
    1966                 :             :                    cost->node, cost->vectype, cost->misalign, cost->where);
    1967                 :      458782 : }
    1968                 :             : 
    /*-----------------------------------------------------------------*/
    /* Info on data references alignment.                              */
    /*-----------------------------------------------------------------*/
    /* Special negative misalignment values.  DR_MISALIGNMENT_UNKNOWN is
       what the alignment helpers in this header compare against when the
       misalignment is not known.  NOTE(review): DR_MISALIGNMENT_UNINITIALIZED
       presumably marks a value that has not been computed yet -- confirm
       at its points of use.  */
    #define DR_MISALIGNMENT_UNKNOWN (-1)
    #define DR_MISALIGNMENT_UNINITIALIZED (-2)
    1974                 :             : 
    1975                 :             : inline void
    1976                 :     2116142 : set_dr_misalignment (dr_vec_info *dr_info, int val)
    1977                 :             : {
    1978                 :     2116142 :   dr_info->misalignment = val;
    1979                 :             : }
    1980                 :             : 
    /* Query the misalignment of DR_INFO for VECTYPE; defined out of line.
       The result is compared against 0 and DR_MISALIGNMENT_UNKNOWN by the
       helpers in this header.  NOTE(review): the role of OFFSET (default 0)
       is not visible here -- see the definition.  */
    extern int dr_misalignment (dr_vec_info *dr_info, tree vectype,
                                poly_int64 offset = 0);

    /* Macro spelling of set_dr_misalignment.  */
    #define SET_DR_MISALIGNMENT(DR, VAL) set_dr_misalignment (DR, VAL)
    1985                 :             : 
    1986                 :             : /* Only defined once DR_MISALIGNMENT is defined.  */
    1987                 :             : inline const poly_uint64
    1988                 :    10352798 : dr_target_alignment (dr_vec_info *dr_info)
    1989                 :             : {
    1990                 :    10352798 :   if (STMT_VINFO_GROUPED_ACCESS (dr_info->stmt))
    1991                 :     8087174 :     dr_info = STMT_VINFO_DR_INFO (DR_GROUP_FIRST_ELEMENT (dr_info->stmt));
    1992                 :    10352798 :   return dr_info->target_alignment;
    1993                 :             : }
    1994                 :             : #define DR_TARGET_ALIGNMENT(DR) dr_target_alignment (DR)
    1995                 :             : 
    1996                 :             : inline void
    1997                 :     1260229 : set_dr_target_alignment (dr_vec_info *dr_info, poly_uint64 val)
    1998                 :             : {
    1999                 :     1260229 :   dr_info->target_alignment = val;
    2000                 :             : }
    2001                 :             : #define SET_DR_TARGET_ALIGNMENT(DR, VAL) set_dr_target_alignment (DR, VAL)
    2002                 :             : 
    2003                 :             : /* Return true if data access DR_INFO is aligned to the targets
    2004                 :             :    preferred alignment for VECTYPE (which may be less than a full vector).  */
    2005                 :             : 
    2006                 :             : inline bool
    2007                 :      221914 : aligned_access_p (dr_vec_info *dr_info, tree vectype)
    2008                 :             : {
    2009                 :      221914 :   return (dr_misalignment (dr_info, vectype) == 0);
    2010                 :             : }
    2011                 :             : 
    2012                 :             : /* Return TRUE if the (mis-)alignment of the data access is known with
    2013                 :             :    respect to the targets preferred alignment for VECTYPE, and FALSE
    2014                 :             :    otherwise.  */
    2015                 :             : 
    2016                 :             : inline bool
    2017                 :     1077121 : known_alignment_for_access_p (dr_vec_info *dr_info, tree vectype)
    2018                 :             : {
    2019                 :      974667 :   return (dr_misalignment (dr_info, vectype) != DR_MISALIGNMENT_UNKNOWN);
    2020                 :             : }
    2021                 :             : 
    2022                 :             : /* Return the minimum alignment in bytes that the vectorized version
    2023                 :             :    of DR_INFO is guaranteed to have.  */
    2024                 :             : 
    2025                 :             : inline unsigned int
    2026                 :      236084 : vect_known_alignment_in_bytes (dr_vec_info *dr_info, tree vectype)
    2027                 :             : {
    2028                 :      236084 :   int misalignment = dr_misalignment (dr_info, vectype);
    2029                 :      236084 :   if (misalignment == DR_MISALIGNMENT_UNKNOWN)
    2030                 :       97885 :     return TYPE_ALIGN_UNIT (TREE_TYPE (DR_REF (dr_info->dr)));
    2031                 :      138199 :   else if (misalignment == 0)
    2032                 :      106396 :     return known_alignment (DR_TARGET_ALIGNMENT (dr_info));
    2033                 :       31803 :   return misalignment & -misalignment;
    2034                 :             : }
    2035                 :             : 
    2036                 :             : /* Return the behavior of DR_INFO with respect to the vectorization context
    2037                 :             :    (which for outer loop vectorization might not be the behavior recorded
    2038                 :             :    in DR_INFO itself).  */
    2039                 :             : 
    2040                 :             : inline innermost_loop_behavior *
    2041                 :     5491892 : vect_dr_behavior (vec_info *vinfo, dr_vec_info *dr_info)
    2042                 :             : {
    2043                 :     5491892 :   stmt_vec_info stmt_info = dr_info->stmt;
    2044                 :     5491892 :   loop_vec_info loop_vinfo = dyn_cast<loop_vec_info> (vinfo);
    2045                 :     1521604 :   if (loop_vinfo == NULL
    2046                 :     1521604 :       || !nested_in_vect_loop_p (LOOP_VINFO_LOOP (loop_vinfo), stmt_info))
    2047                 :     5487553 :     return &DR_INNERMOST (dr_info->dr);
    2048                 :             :   else
    2049                 :        4339 :     return &STMT_VINFO_DR_WRT_VEC_LOOP (stmt_info);
    2050                 :             : }
    2051                 :             : 
    2052                 :             : /* Return the base offset of DR_INFO's data reference, plus DR_INFO->offset
    2053                 :             :    when that is set (the sum then has the type of DR_INFO->offset).  If
    2054                 :             :    CHECK_OUTER, take the base from vect_dr_behavior, else from dr->innermost.  */
    2055                 :             : 
    2056                 :             : inline tree
    2057                 :      710411 : get_dr_vinfo_offset (vec_info *vinfo,
    2058                 :             :                      dr_vec_info *dr_info, bool check_outer = false)
    2059                 :             : {
    2060                 :      710411 :   innermost_loop_behavior *base;
    2061                 :      710411 :   if (check_outer)
    2062                 :      669224 :     base = vect_dr_behavior (vinfo, dr_info);
    2063                 :             :   else
    2064                 :       41187 :     base = &dr_info->dr->innermost;
    2065                 :             : 
    2066                 :      710411 :   tree offset = base->offset;
    2067                 :             : 
    2068                 :      710411 :   if (!dr_info->offset)
    2069                 :             :     return offset;  /* No extra offset on DR_INFO: return the base offset unconverted.  */
    2070                 :             : 
    2071                 :       17880 :   offset = fold_convert (sizetype, offset);  /* Convert the base offset to sizetype before adding.  */
    2072                 :       17880 :   return fold_build2 (PLUS_EXPR, TREE_TYPE (dr_info->offset), offset,
    2073                 :             :                       dr_info->offset);
    2074                 :             : }
    2075                 :             : 
    2076                 :             : 
    2077                 :             : /* Return the vect cost model for LOOP, which may be NULL.  */
    2078                 :             : inline enum vect_cost_model
    2079                 :     1411851 : loop_cost_model (loop_p loop)
    2080                 :             : {
    2081                 :     1411851 :   if (loop != NULL
    2082                 :      764523 :       && loop->force_vectorize
    2083                 :       70489 :       && flag_simd_cost_model != VECT_COST_MODEL_DEFAULT)
    2084                 :             :     return flag_simd_cost_model;  /* force_vectorize loop with a non-default simd cost model.  */
    2085                 :     1341362 :   return flag_vect_cost_model;  /* All other cases, including LOOP == NULL.  */
    2086                 :             : }
    2087                 :             : 
    2088                 :             : /* Return true if loop_cost_model (LOOP) is VECT_COST_MODEL_UNLIMITED.  */
    2089                 :             : inline bool
    2090                 :     1023504 : unlimited_cost_model (loop_p loop)
    2091                 :             : {
    2092                 :     1023504 :   return loop_cost_model (loop) == VECT_COST_MODEL_UNLIMITED;
    2093                 :             : }
    2094                 :             : 
    2095                 :             : /* Return true if the loop described by LOOP_VINFO is fully-masked and
    2096                 :             :    LOOP_VINFO_PEELING_FOR_ALIGNMENT is nonzero, i.e. if the first iteration
    2097                 :             :    should use a partial mask in order to achieve alignment.  */
    2098                 :             : 
    2099                 :             : inline bool
    2100                 :      195166 : vect_use_loop_mask_for_alignment_p (loop_vec_info loop_vinfo)
    2101                 :             : {
    2102                 :          35 :   return (LOOP_VINFO_FULLY_MASKED_P (loop_vinfo)
    2103                 :      195201 :           && LOOP_VINFO_PEELING_FOR_ALIGNMENT (loop_vinfo));
    2104                 :             : }
    2105                 :             : 
    2106                 :             : /* Return the number of vectors of type VECTYPE that are needed to get
    2107                 :             :    NUNITS elements.  NUNITS should be based on the vectorization factor,
    2108                 :             :    so it is always a known multiple of the number of elements in VECTYPE;
                         the code relies on this by using exact_div and to_constant.  */
    2109                 :             : 
    2110                 :             : inline unsigned int
    2111                 :     3221256 : vect_get_num_vectors (poly_uint64 nunits, tree vectype)
    2112                 :             : {
    2113                 :     3221256 :   return exact_div (nunits, TYPE_VECTOR_SUBPARTS (vectype)).to_constant ();
    2114                 :             : }
    2115                 :             : 
    2116                 :             : /* Return the number of vectors of type VECTYPE needed, in the context of
    2117                 :             :    vectorization region VINFO, for a group of statements whose size is the
    2118                 :             :    number of lanes of NODE (or 1 if NODE is NULL).  The statements are
    2119                 :             :    supposed to be interleaved together with no gap.  If VECTYPE is NULL,
    2120                 :             :    the vectype of NODE is used.  */
    2121                 :             : 
    2122                 :             : inline unsigned int
    2123                 :     3221256 : vect_get_num_copies (vec_info *vinfo, slp_tree node, tree vectype = NULL)
    2124                 :             : {
    2125                 :     3221256 :   poly_uint64 vf;
    2126                 :             : 
    2127                 :     3199528 :   if (loop_vec_info loop_vinfo = dyn_cast <loop_vec_info> (vinfo))
    2128                 :     1334061 :     vf = LOOP_VINFO_VECT_FACTOR (loop_vinfo);
    2129                 :             :   else
    2130                 :             :     vf = 1;  /* VINFO is not a loop_vec_info.  */
    2131                 :             : 
    2132                 :     3171612 :   if (node)
    2133                 :             :     {
    2134                 :     3157642 :       vf *= SLP_TREE_LANES (node);
    2135                 :     3157642 :       if (!vectype)
    2136                 :     3146611 :         vectype = SLP_TREE_VECTYPE (node);
    2137                 :             :     }
    2138                 :             : 
    2139                 :     3221256 :   return vect_get_num_vectors (vf, vectype);  /* NOTE(review): VECTYPE is still NULL here if both NODE and VECTYPE were NULL; presumably callers never do that -- confirm.  */
    2140                 :             : }
    2141                 :             : 
    2142                 :             : /* Return the number of copies needed for loop vectorization when
    2143                 :             :    a statement operates on vectors of type VECTYPE.  This is the
    2144                 :             :    vectorization factor divided by the number of elements in
    2145                 :             :    VECTYPE and is always known at compile time.  */
    2146                 :             : 
    2147                 :             : inline unsigned int
    2148                 :       63602 : vect_get_num_copies (loop_vec_info loop_vinfo, tree vectype)
    2149                 :             : {
    2150                 :       63602 :   return vect_get_num_copies (loop_vinfo, NULL, vectype);  /* Forward to the vec_info/slp_tree overload with a NULL node.  */
    2151                 :             : }
    2152                 :             : 
    2153                 :             : /* Update maximum unit count *MAX_NUNITS so that it accounts for NUNITS, by
    2154                 :             :    replacing it with a common multiple of its old value and NUNITS.  *MAX_NUNITS can be 1 if we haven't yet recorded anything.  */
    2155                 :             : 
    2156                 :             : inline void
    2157                 :     8807796 : vect_update_max_nunits (poly_uint64 *max_nunits, poly_uint64 nunits)
    2158                 :             : {
    2159                 :             :   /* All unit counts have the form vec_info::vector_size * X for some
    2160                 :             :      rational X, so two unit sizes must have a common multiple.
    2161                 :             :      Everything is a multiple of the initial value of 1.  */
    2162                 :     5690567 :   *max_nunits = force_common_multiple (*max_nunits, nunits);
    2163                 :             : }
    2164                 :             : 
    2165                 :             : /* Update maximum unit count *MAX_NUNITS so that it accounts for
    2166                 :             :    the number of units in vector type VECTYPE.  *MAX_NUNITS can be 1
    2167                 :             :    if we haven't yet recorded any vector types.  */
    2168                 :             : 
    2169                 :             : inline void
    2170                 :     5808143 : vect_update_max_nunits (poly_uint64 *max_nunits, tree vectype)
    2171                 :             : {
    2172                 :     5808143 :   vect_update_max_nunits (max_nunits, TYPE_VECTOR_SUBPARTS (vectype));  /* Forward to the poly_uint64 overload.  */
    2173                 :     5808143 : }
    2174                 :             : 
    2175                 :             : /* Return the vectorization factor that should be used for costing
    2176                 :             :    purposes while vectorizing the loop described by LOOP_VINFO.
    2177                 :             :    Pick a reasonable estimate (via estimated_poly_value) if the
    2178                 :             :    vectorization factor isn't known at compile time.  */
    2179                 :             : 
    2180                 :             : inline unsigned int
    2181                 :      746132 : vect_vf_for_cost (loop_vec_info loop_vinfo)
    2182                 :             : {
    2183                 :      746132 :   return estimated_poly_value (LOOP_VINFO_VECT_FACTOR (loop_vinfo));
    2184                 :             : }
    2185                 :             : 
    2186                 :             : /* Estimate the number of elements in VEC_TYPE for costing purposes.
    2187                 :             :    Pick a reasonable estimate (via estimated_poly_value) if the exact
    2188                 :             :    number isn't known at compile time.  */
    2189                 :             : 
    2190                 :             : inline unsigned int
    2191                 :       22563 : vect_nunits_for_cost (tree vec_type)
    2192                 :             : {
    2193                 :       22563 :   return estimated_poly_value (TYPE_VECTOR_SUBPARTS (vec_type));
    2194                 :             : }
    2195                 :             : 
    2196                 :             : /* Return the maximum possible vectorization factor for LOOP_VINFO.  */
    2197                 :             : 
    2198                 :             : inline unsigned HOST_WIDE_INT
    2199                 :       17810 : vect_max_vf (loop_vec_info loop_vinfo)
    2200                 :             : {
    2201                 :       17810 :   unsigned HOST_WIDE_INT vf;
    2202                 :       17810 :   if (LOOP_VINFO_VECT_FACTOR (loop_vinfo).is_constant (&vf))
    2203                 :       17810 :     return vf;  /* The vectorization factor is a compile-time constant.  */
    2204                 :             :   return MAX_VECTORIZATION_FACTOR;  /* Non-constant factor: fall back to the global upper bound.  */
    2205                 :             : }
    2206                 :             : 
    2207                 :             : /* Return the size of the value accessed by unvectorized data reference
    2208                 :             :    DR_INFO.  This is only valid once STMT_VINFO_VECTYPE has been calculated
    2209                 :             :    for the associated gimple statement, since that guarantees that DR_INFO
    2210                 :             :    accesses either a scalar or a scalar equivalent.  ("Scalar equivalent"
    2211                 :             :    here includes things like V1SI, which can be vectorized in the same way
    2212                 :             :    as a plain SI.)  */
    2213                 :             : 
    2214                 :             : inline unsigned int
    2215                 :      239010 : vect_get_scalar_dr_size (dr_vec_info *dr_info)
    2216                 :             : {
    2217                 :      239010 :   return tree_to_uhwi (TYPE_SIZE_UNIT (TREE_TYPE (DR_REF (dr_info->dr))));  /* The tree_to_uhwi result is narrowed to unsigned int by the return type.  */
    2218                 :             : }
    2219                 :             : 
    2220                 :             : /* Return true if LOOP_VINFO requires a runtime check for whether the
    2221                 :             :    vector loop is profitable: LOOP_VINFO_NITERS_KNOWN_P is false and the cost-model threshold is at least vect_vf_for_cost (LOOP_VINFO).  */
    2222                 :             : 
    2223                 :             : inline bool
    2224                 :       60191 : vect_apply_runtime_profitability_check_p (loop_vec_info loop_vinfo)
    2225                 :             : {
    2226                 :       60191 :   unsigned int th = LOOP_VINFO_COST_MODEL_THRESHOLD (loop_vinfo);
    2227                 :       32991 :   return (!LOOP_VINFO_NITERS_KNOWN_P (loop_vinfo)
    2228                 :       60191 :           && th >= vect_vf_for_cost (loop_vinfo));
    2229                 :             : }
    2230                 :             : 
    2231                 :             : /* Return true if CODE is a lane-reducing opcode, i.e. one of DOT_PROD_EXPR, WIDEN_SUM_EXPR or SAD_EXPR.  */
    2232                 :             : 
    2233                 :             : inline bool
    2234                 :      317046 : lane_reducing_op_p (code_helper code)
    2235                 :             : {
    2236                 :      317046 :   return code == DOT_PROD_EXPR || code == WIDEN_SUM_EXPR || code == SAD_EXPR;
    2237                 :             : }
    2238                 :             : 
    2239                 :             : /* Return true if STMT is a lane-reducing statement, i.e. a gassign whose rhs code satisfies lane_reducing_op_p.  */
    2240                 :             : 
    2241                 :             : inline bool
    2242                 :      355790 : lane_reducing_stmt_p (gimple *stmt)
    2243                 :             : {
    2244                 :      355790 :   if (auto *assign = dyn_cast <gassign *> (stmt))
    2245                 :      217598 :     return lane_reducing_op_p (gimple_assign_rhs_code (assign));
    2246                 :             :   return false;  /* STMT is not a gassign.  */
    2247                 :             : }
    2248                 :             : 
    2249                 :             : /* Source location + hotness information. */
    2250                 :             : extern dump_user_location_t vect_location;
    2251                 :             : 
    2252                 :             : /* A macro (wrapping AUTO_DUMP_SCOPE with vect_location) for calling:
    2253                 :             :      dump_begin_scope (MSG, vect_location);
    2254                 :             :    via an RAII object, thus printing "=== MSG ===\n" to the dumpfile etc,
    2255                 :             :    and then calling
    2256                 :             :      dump_end_scope ();
    2257                 :             :    once the object goes out of scope, thus capturing the nesting of
    2258                 :             :    the scopes.
    2259                 :             : 
    2260                 :             :    These scopes affect dump messages within them: dump messages at the
    2261                 :             :    top level implicitly default to MSG_PRIORITY_USER_FACING, whereas those
    2262                 :             :    in a nested scope implicitly default to MSG_PRIORITY_INTERNALS.  */
    2263                 :             : 
    2264                 :             : #define DUMP_VECT_SCOPE(MSG) \
    2265                 :             :   AUTO_DUMP_SCOPE (MSG, vect_location)
    2266                 :             : 
    2267                 :             : /* A sentinel class for ensuring that the "vect_location" global gets
    2268                 :             :    reset at the end of a scope.
    2269                 :             : 
    2270                 :             :    The "vect_location" global is used during dumping and contains a
    2271                 :             :    location_t, which could contain references to a tree block via the
    2272                 :             :    ad-hoc data.  This data is used for tracking inlining information,
    2273                 :             :    but it's not a GC root; it's simply assumed that such locations never
    2274                 :             :    get accessed if the blocks are optimized away.
    2275                 :             : 
    2276                 :             :    Hence we need to ensure that such locations are purged at the end
    2277                 :             :    of any operations using them (e.g. via this class).  */
    2278                 :             : 
    2279                 :             : class auto_purge_vect_location
    2280                 :             : {
    2281                 :             :  public:
    2282                 :             :   ~auto_purge_vect_location ();  /* Only declared here; the definition is elsewhere.  */
    2283                 :             : };
    2284                 :             : 
    2285                 :             : /*-----------------------------------------------------------------*/
    2286                 :             : /* Function prototypes.                                            */
    2287                 :             : /*-----------------------------------------------------------------*/
    2288                 :             : 
    2289                 :             : /* Simple loop peeling and versioning utilities for vectorizer's purposes -
    2290                 :             :    in tree-vect-loop-manip.cc.  */
    2291                 :             : extern void vect_set_loop_condition (class loop *, edge, loop_vec_info,
    2292                 :             :                                      tree, tree, tree, bool);
    2293                 :             : extern bool slpeel_can_duplicate_loop_p (const class loop *, const_edge,
    2294                 :             :                                          const_edge);
    2295                 :             : class loop *slpeel_tree_duplicate_loop_to_edge_cfg (class loop *, edge,
    2296                 :             :                                                     class loop *, edge,
    2297                 :             :                                                     edge, edge *, bool = true,
    2298                 :             :                                                     vec<basic_block> * = NULL);
    2299                 :             : class loop *vect_loop_versioning (loop_vec_info, gimple *);
    2300                 :             : extern class loop *vect_do_peeling (loop_vec_info, tree, tree,
    2301                 :             :                                     tree *, tree *, tree *, int, bool, bool,
    2302                 :             :                                     tree *);
    2303                 :             : extern tree vect_get_main_loop_result (loop_vec_info, tree, tree);
    2304                 :             : extern void vect_prepare_for_masked_peels (loop_vec_info);
    2305                 :             : extern dump_user_location_t find_loop_location (class loop *);
    2306                 :             : extern bool vect_can_advance_ivs_p (loop_vec_info);
    2307                 :             : extern void vect_update_inits_of_drs (loop_vec_info, tree, tree_code);
    2308                 :             : extern edge vec_init_loop_exit_info (class loop *);
    2309                 :             : extern void vect_iv_increment_position (edge, gimple_stmt_iterator *, bool *);
    2310                 :             : 
    2311                 :             : /* In tree-vect-stmts.cc.  */
    2312                 :             : extern tree get_related_vectype_for_scalar_type (machine_mode, tree,
    2313                 :             :                                                  poly_uint64 = 0);
    2314                 :             : extern tree get_vectype_for_scalar_type (vec_info *, tree, unsigned int = 0);
    2315                 :             : extern tree get_vectype_for_scalar_type (vec_info *, tree, slp_tree);
    2316                 :             : extern tree get_mask_type_for_scalar_type (vec_info *, tree, unsigned int = 0);
    2317                 :             : extern tree get_mask_type_for_scalar_type (vec_info *, tree, slp_tree);
    2318                 :             : extern tree get_same_sized_vectype (tree, tree);
    2319                 :             : extern bool vect_chooses_same_modes_p (vec_info *, machine_mode);
    2320                 :             : extern bool vect_get_loop_mask_type (loop_vec_info);
    2321                 :             : extern bool vect_is_simple_use (tree, vec_info *, enum vect_def_type *,
    2322                 :             :                                 stmt_vec_info * = NULL, gimple ** = NULL);
    2323                 :             : extern bool vect_is_simple_use (tree, vec_info *, enum vect_def_type *,
    2324                 :             :                                 tree *, stmt_vec_info * = NULL,
    2325                 :             :                                 gimple ** = NULL);
    2326                 :             : extern bool vect_is_simple_use (vec_info *, stmt_vec_info, slp_tree,
    2327                 :             :                                 unsigned, tree *, slp_tree *,
    2328                 :             :                                 enum vect_def_type *,
    2329                 :             :                                 tree *, stmt_vec_info * = NULL);
    2330                 :             : extern bool vect_maybe_update_slp_op_vectype (slp_tree, tree);
    2331                 :             : extern tree perm_mask_for_reverse (tree);
    2332                 :             : extern bool supportable_widening_operation (vec_info*, code_helper,
    2333                 :             :                                             stmt_vec_info, tree, tree,
    2334                 :             :                                             code_helper*, code_helper*,
    2335                 :             :                                             int*, vec<tree> *);
    2336                 :             : extern bool supportable_narrowing_operation (code_helper, tree, tree,
    2337                 :             :                                              code_helper *, int *,
    2338                 :             :                                              vec<tree> *);
    2339                 :             : extern bool supportable_indirect_convert_operation (code_helper,
    2340                 :             :                                                     tree, tree,
    2341                 :             :                                                     vec<std::pair<tree, tree_code> > *,
    2342                 :             :                                                     tree = NULL_TREE);
    2343                 :             : extern int compare_step_with_zero (vec_info *, stmt_vec_info);
    2344                 :             : 
    2345                 :             : extern unsigned record_stmt_cost (stmt_vector_for_cost *, int,
    2346                 :             :                                   enum vect_cost_for_stmt, stmt_vec_info,
    2347                 :             :                                   tree, int, enum vect_cost_model_location);
    2348                 :             : extern unsigned record_stmt_cost (stmt_vector_for_cost *, int,
    2349                 :             :                                   enum vect_cost_for_stmt, slp_tree,
    2350                 :             :                                   tree, int, enum vect_cost_model_location);
    2351                 :             : extern unsigned record_stmt_cost (stmt_vector_for_cost *, int,
    2352                 :             :                                   enum vect_cost_for_stmt,
    2353                 :             :                                   enum vect_cost_model_location);
    2354                 :             : extern unsigned record_stmt_cost (stmt_vector_for_cost *, int,
    2355                 :             :                                   enum vect_cost_for_stmt, stmt_vec_info,
    2356                 :             :                                   slp_tree, tree, int,
    2357                 :             :                                   enum vect_cost_model_location);
    2358                 :             : 
    2359                 :             : /* Overload of record_stmt_cost with VECTYPE derived from STMT_INFO via STMT_VINFO_VECTYPE; all other arguments are forwarded unchanged.  */
    2360                 :             : 
    2361                 :             : inline unsigned
    2362                 :     2779521 : record_stmt_cost (stmt_vector_for_cost *body_cost_vec, int count,
    2363                 :             :                   enum vect_cost_for_stmt kind, stmt_vec_info stmt_info,
    2364                 :             :                   int misalign, enum vect_cost_model_location where)
    2365                 :             : {
    2366                 :     2654710 :   return record_stmt_cost (body_cost_vec, count, kind, stmt_info,
    2367                 :      918780 :                            STMT_VINFO_VECTYPE (stmt_info), misalign, where);
    2368                 :             : }
    2369                 :             : 
    2370                 :             : /* Overload of record_stmt_cost with VECTYPE derived from STMT_INFO (via
    2371                 :             :    STMT_VINFO_VECTYPE, not from NODE) and SLP node specified.  */
    2372                 :             : 
    2373                 :             : inline unsigned
    2374                 :     1825825 : record_stmt_cost (stmt_vector_for_cost *body_cost_vec, int count,
    2375                 :             :                   enum vect_cost_for_stmt kind, stmt_vec_info stmt_info,
    2376                 :             :                   slp_tree node,
    2377                 :             :                   int misalign, enum vect_cost_model_location where)
    2378                 :             : {
    2379                 :     1793400 :   return record_stmt_cost (body_cost_vec, count, kind, stmt_info, node,
    2380                 :             :                            STMT_VINFO_VECTYPE (stmt_info), misalign, where);
    2381                 :             : }
    2382                 :             : 
    2383                 :             : extern void vect_finish_replace_stmt (vec_info *, stmt_vec_info, gimple *);
    2384                 :             : extern void vect_finish_stmt_generation (vec_info *, stmt_vec_info, gimple *,
    2385                 :             :                                          gimple_stmt_iterator *);
    2386                 :             : extern opt_result vect_mark_stmts_to_be_vectorized (loop_vec_info, bool *);
    2387                 :             : extern tree vect_get_store_rhs (stmt_vec_info);
    2388                 :             : void vect_get_vec_defs_for_operand (vec_info *vinfo, stmt_vec_info, unsigned,
    2389                 :             :                                     tree op, vec<tree> *, tree = NULL);
    2390                 :             : void vect_get_vec_defs (vec_info *, stmt_vec_info, slp_tree, unsigned,
    2391                 :             :                         tree, vec<tree> *,
    2392                 :             :                         tree = NULL, vec<tree> * = NULL,
    2393                 :             :                         tree = NULL, vec<tree> * = NULL,
    2394                 :             :                         tree = NULL, vec<tree> * = NULL);
    2395                 :             : void vect_get_vec_defs (vec_info *, stmt_vec_info, slp_tree, unsigned,
    2396                 :             :                         tree, tree, vec<tree> *,
    2397                 :             :                         tree = NULL, tree = NULL, vec<tree> * = NULL,
    2398                 :             :                         tree = NULL, tree = NULL, vec<tree> * = NULL,
    2399                 :             :                         tree = NULL, tree = NULL, vec<tree> * = NULL);
    2400                 :             : extern tree vect_init_vector (vec_info *, stmt_vec_info, tree, tree,
    2401                 :             :                               gimple_stmt_iterator *);
    2402                 :             : extern tree vect_get_slp_vect_def (slp_tree, unsigned);
    2403                 :             : extern bool vect_transform_stmt (vec_info *, stmt_vec_info,
    2404                 :             :                                  gimple_stmt_iterator *,
    2405                 :             :                                  slp_tree, slp_instance);
    2406                 :             : extern void vect_remove_stores (vec_info *, stmt_vec_info);
    2407                 :             : extern bool vect_nop_conversion_p (stmt_vec_info);
    2408                 :             : extern opt_result vect_analyze_stmt (vec_info *, stmt_vec_info, bool *,
    2409                 :             :                                      slp_tree,
    2410                 :             :                                      slp_instance, stmt_vector_for_cost *);
    2411                 :             : extern void vect_get_load_cost (vec_info *, stmt_vec_info, slp_tree, int,
    2412                 :             :                                 dr_alignment_support, int, bool,
    2413                 :             :                                 unsigned int *, unsigned int *,
    2414                 :             :                                 stmt_vector_for_cost *,
    2415                 :             :                                 stmt_vector_for_cost *, bool);
    2416                 :             : extern void vect_get_store_cost (vec_info *, stmt_vec_info, slp_tree, int,
    2417                 :             :                                  dr_alignment_support, int,
    2418                 :             :                                  unsigned int *, stmt_vector_for_cost *);
    2419                 :             : extern bool vect_supportable_shift (vec_info *, enum tree_code, tree);
    2420                 :             : extern tree vect_gen_perm_mask_any (tree, const vec_perm_indices &);
    2421                 :             : extern tree vect_gen_perm_mask_checked (tree, const vec_perm_indices &);
    2422                 :             : extern void optimize_mask_stores (class loop*);
    2423                 :             : extern tree vect_gen_while (gimple_seq *, tree, tree, tree,
    2424                 :             :                             const char * = nullptr);
    2425                 :             : extern tree vect_gen_while_not (gimple_seq *, tree, tree, tree);
    2426                 :             : extern opt_result vect_get_vector_types_for_stmt (vec_info *,
    2427                 :             :                                                   stmt_vec_info, tree *,
    2428                 :             :                                                   tree *, unsigned int = 0);
    2429                 :             : extern opt_tree vect_get_mask_type_for_stmt (stmt_vec_info, unsigned int = 0);
    2430                 :             : 
    2431                 :             : /* In tree-if-conv.cc.  */
    2432                 :             : extern bool ref_within_array_bound (gimple *, tree);
    2433                 :             : 
    2434                 :             : /* In tree-vect-data-refs.cc.  */
    2435                 :             : extern bool vect_can_force_dr_alignment_p (const_tree, poly_uint64);
    2436                 :             : extern enum dr_alignment_support vect_supportable_dr_alignment
    2437                 :             :                                    (vec_info *, dr_vec_info *, tree, int);
    2438                 :             : extern tree vect_get_smallest_scalar_type (stmt_vec_info, tree);
    2439                 :             : extern opt_result vect_analyze_data_ref_dependences (loop_vec_info, unsigned int *);
    2440                 :             : extern bool vect_slp_analyze_instance_dependence (vec_info *, slp_instance);
    2441                 :             : extern opt_result vect_enhance_data_refs_alignment (loop_vec_info);
    2442                 :             : extern opt_result vect_analyze_data_refs_alignment (loop_vec_info);
    2443                 :             : extern bool vect_slp_analyze_instance_alignment (vec_info *, slp_instance);
    2444                 :             : extern opt_result vect_analyze_data_ref_accesses (vec_info *, vec<int> *);
    2445                 :             : extern opt_result vect_prune_runtime_alias_test_list (loop_vec_info);
    2446                 :             : extern bool vect_gather_scatter_fn_p (vec_info *, bool, bool, tree, tree,
    2447                 :             :                                       tree, int, internal_fn *, tree *,
    2448                 :             :                                       vec<int> * = nullptr);
    2449                 :             : extern bool vect_check_gather_scatter (stmt_vec_info, loop_vec_info,
    2450                 :             :                                        gather_scatter_info *,
    2451                 :             :                                        vec<int> * = nullptr);
    2452                 :             : extern opt_result vect_find_stmt_data_reference (loop_p, gimple *,
    2453                 :             :                                                  vec<data_reference_p> *,
    2454                 :             :                                                  vec<int> *, int);
    2455                 :             : extern opt_result vect_analyze_data_refs (vec_info *, poly_uint64 *, bool *);
    2456                 :             : extern void vect_record_base_alignments (vec_info *);
    2457                 :             : extern tree vect_create_data_ref_ptr (vec_info *,
    2458                 :             :                                       stmt_vec_info, tree, class loop *, tree,
    2459                 :             :                                       tree *, gimple_stmt_iterator *,
    2460                 :             :                                       gimple **, bool,
    2461                 :             :                                       tree = NULL_TREE);
    2462                 :             : extern tree bump_vector_ptr (vec_info *, tree, gimple *, gimple_stmt_iterator *,
    2463                 :             :                              stmt_vec_info, tree);
    2464                 :             : extern void vect_copy_ref_info (tree, tree);
    2465                 :             : extern tree vect_create_destination_var (tree, tree);
    2466                 :             : extern bool vect_grouped_store_supported (tree, unsigned HOST_WIDE_INT);
    2467                 :             : extern internal_fn vect_store_lanes_supported (tree, unsigned HOST_WIDE_INT, bool);
    2468                 :             : extern bool vect_grouped_load_supported (tree, bool, unsigned HOST_WIDE_INT);
    2469                 :             : extern internal_fn vect_load_lanes_supported (tree, unsigned HOST_WIDE_INT,
    2470                 :             :                                               bool, vec<int> * = nullptr);
    2471                 :             : extern void vect_permute_store_chain (vec_info *, vec<tree> &,
    2472                 :             :                                       unsigned int, stmt_vec_info,
    2473                 :             :                                       gimple_stmt_iterator *, vec<tree> *);
    2474                 :             : extern tree vect_setup_realignment (vec_info *,
    2475                 :             :                                     stmt_vec_info, gimple_stmt_iterator *,
    2476                 :             :                                     tree *, enum dr_alignment_support, tree,
    2477                 :             :                                     class loop **);
    2478                 :             : extern void vect_transform_grouped_load (vec_info *, stmt_vec_info, vec<tree>,
    2479                 :             :                                          int, gimple_stmt_iterator *);
    2480                 :             : extern void vect_record_grouped_load_vectors (vec_info *,
    2481                 :             :                                               stmt_vec_info, vec<tree>);
    2482                 :             : extern tree vect_get_new_vect_var (tree, enum vect_var_kind, const char *);
    2483                 :             : extern tree vect_get_new_ssa_name (tree, enum vect_var_kind,
    2484                 :             :                                    const char * = NULL);
    2485                 :             : extern tree vect_create_addr_base_for_vector_ref (vec_info *,
    2486                 :             :                                                   stmt_vec_info, gimple_seq *,
    2487                 :             :                                                   tree);
    2488                 :             : 
    2489                 :             : /* In tree-vect-loop.cc.  */
    2490                 :             : extern tree neutral_op_for_reduction (tree, code_helper, tree, bool = true);
    2491                 :             : extern widest_int vect_iv_limit_for_partial_vectors (loop_vec_info loop_vinfo);
    2492                 :             : bool vect_rgroup_iv_might_wrap_p (loop_vec_info, rgroup_controls *);
    2493                 :             : /* Used in tree-vect-loop-manip.cc */
    2494                 :             : extern opt_result vect_determine_partial_vectors_and_peeling (loop_vec_info);
    2495                 :             : /* Used in gimple-loop-interchange.cc and tree-parloops.cc.  */
    2496                 :             : extern bool check_reduction_path (dump_user_location_t, loop_p, gphi *, tree,
    2497                 :             :                                   enum tree_code);
    2498                 :             : extern bool needs_fold_left_reduction_p (tree, code_helper);
    2499                 :             : /* Driver for loop analysis stage.  */
    2500                 :             : extern opt_loop_vec_info vect_analyze_loop (class loop *, gimple *,
    2501                 :             :                                             vec_info_shared *);
    2502                 :             : extern tree vect_build_loop_niters (loop_vec_info, bool * = NULL);
    2503                 :             : extern void vect_gen_vector_loop_niters (loop_vec_info, tree, tree *,
    2504                 :             :                                          tree *, bool);
    2505                 :             : extern tree vect_halve_mask_nunits (tree, machine_mode);
    2506                 :             : extern tree vect_double_mask_nunits (tree, machine_mode);
    2507                 :             : extern void vect_record_loop_mask (loop_vec_info, vec_loop_masks *,
    2508                 :             :                                    unsigned int, tree, tree);
    2509                 :             : extern tree vect_get_loop_mask (loop_vec_info, gimple_stmt_iterator *,
    2510                 :             :                                 vec_loop_masks *,
    2511                 :             :                                 unsigned int, tree, unsigned int);
    2512                 :             : extern void vect_record_loop_len (loop_vec_info, vec_loop_lens *, unsigned int,
    2513                 :             :                                   tree, unsigned int);
    2514                 :             : extern tree vect_get_loop_len (loop_vec_info, gimple_stmt_iterator *,
    2515                 :             :                                vec_loop_lens *, unsigned int, tree,
    2516                 :             :                                unsigned int, unsigned int);
    2517                 :             : extern tree vect_gen_loop_len_mask (loop_vec_info, gimple_stmt_iterator *,
    2518                 :             :                                     gimple_stmt_iterator *, vec_loop_lens *,
    2519                 :             :                                     unsigned int, tree, tree, unsigned int,
    2520                 :             :                                     unsigned int);
    2521                 :             : extern gimple_seq vect_gen_len (tree, tree, tree, tree);
    2522                 :             : extern stmt_vec_info info_for_reduction (vec_info *, stmt_vec_info);
    2523                 :             : extern bool reduction_fn_for_scalar_code (code_helper, internal_fn *);
    2524                 :             : 
    2525                 :             : /* Driver for loop transformation stage.  */
    2526                 :             : extern class loop *vect_transform_loop (loop_vec_info, gimple *);
    2527                 :      842536 : struct vect_loop_form_info  /* Taken non-const by vect_analyze_loop_form, const by vect_create_loop_vinfo.  */
    2528                 :             : {
    2529                 :             :   tree number_of_iterations;
    2530                 :             :   tree number_of_iterationsm1;  /* NOTE(review): presumably number_of_iterations minus one -- confirm.  */
    2531                 :             :   tree assumptions;
    2532                 :             :   auto_vec<gcond *> conds;
    2533                 :             :   gcond *inner_loop_cond;  /* NOTE(review): presumably only meaningful for nested loops -- confirm.  */
    2534                 :             :   edge loop_exit;
    2535                 :             : };
    2536                 :             : extern opt_result vect_analyze_loop_form (class loop *, gimple *,
    2537                 :             :                                           vect_loop_form_info *);
    2538                 :             : extern loop_vec_info vect_create_loop_vinfo (class loop *, vec_info_shared *,
    2539                 :             :                                              const vect_loop_form_info *,
    2540                 :             :                                              loop_vec_info = nullptr);
    2541                 :             : extern bool vectorizable_live_operation (vec_info *, stmt_vec_info,
    2542                 :             :                                          slp_tree, slp_instance, int,
    2543                 :             :                                          bool, stmt_vector_for_cost *);
    2544                 :             : extern bool vectorizable_lane_reducing (loop_vec_info, stmt_vec_info,
    2545                 :             :                                         slp_tree, stmt_vector_for_cost *);
    2546                 :             : extern bool vectorizable_reduction (loop_vec_info, stmt_vec_info,
    2547                 :             :                                     slp_tree, slp_instance,
    2548                 :             :                                     stmt_vector_for_cost *);
    2549                 :             : extern bool vectorizable_induction (loop_vec_info, stmt_vec_info,
    2550                 :             :                                     gimple **, slp_tree,
    2551                 :             :                                     stmt_vector_for_cost *);
    2552                 :             : extern bool vect_transform_reduction (loop_vec_info, stmt_vec_info,
    2553                 :             :                                       gimple_stmt_iterator *,
    2554                 :             :                                       gimple **, slp_tree);
    2555                 :             : extern bool vect_transform_cycle_phi (loop_vec_info, stmt_vec_info,
    2556                 :             :                                       gimple **,
    2557                 :             :                                       slp_tree, slp_instance);
    2558                 :             : extern bool vectorizable_lc_phi (loop_vec_info, stmt_vec_info,
    2559                 :             :                                  gimple **, slp_tree);
    2560                 :             : extern bool vectorizable_phi (vec_info *, stmt_vec_info, gimple **, slp_tree,
    2561                 :             :                               stmt_vector_for_cost *);
    2562                 :             : extern bool vectorizable_recurr (loop_vec_info, stmt_vec_info,
    2563                 :             :                                   gimple **, slp_tree, stmt_vector_for_cost *);
    2564                 :             : extern bool vectorizable_early_exit (vec_info *, stmt_vec_info,
    2565                 :             :                                      gimple_stmt_iterator *, gimple **,
    2566                 :             :                                      slp_tree, stmt_vector_for_cost *);
    2567                 :             : extern bool vect_emulated_vector_p (tree);
    2568                 :             : extern bool vect_can_vectorize_without_simd_p (tree_code);
    2569                 :             : extern bool vect_can_vectorize_without_simd_p (code_helper);
    2570                 :             : extern int vect_get_known_peeling_cost (loop_vec_info, int, int *,
    2571                 :             :                                         stmt_vector_for_cost *,
    2572                 :             :                                         stmt_vector_for_cost *,
    2573                 :             :                                         stmt_vector_for_cost *);
    2574                 :             : extern tree cse_and_gimplify_to_preheader (loop_vec_info, tree);
    2575                 :             : 
    2576                 :             : /* Nonlinear induction.  */
    2577                 :             : extern tree vect_peel_nonlinear_iv_init (gimple_seq*, tree, tree,
    2578                 :             :                                          tree, enum vect_induction_op_type);
    2579                 :             : 
    2580                 :             : /* In tree-vect-slp.cc.  */
    2581                 :             : extern void vect_slp_init (void);
    2582                 :             : extern void vect_slp_fini (void);
    2583                 :             : extern void vect_free_slp_instance (slp_instance);
    2584                 :             : extern bool vect_transform_slp_perm_load (vec_info *, slp_tree, const vec<tree> &,
    2585                 :             :                                           gimple_stmt_iterator *, poly_uint64,
    2586                 :             :                                           bool, unsigned *,
    2587                 :             :                                           unsigned * = nullptr, bool = false);
    2588                 :             : extern bool vect_slp_analyze_operations (vec_info *);
    2589                 :             : extern void vect_schedule_slp (vec_info *, const vec<slp_instance> &);
    2590                 :             : extern opt_result vect_analyze_slp (vec_info *, unsigned, bool);
    2591                 :             : extern bool vect_make_slp_decision (loop_vec_info);
    2592                 :             : extern void vect_detect_hybrid_slp (loop_vec_info);
    2593                 :             : extern void vect_optimize_slp (vec_info *);
    2594                 :             : extern void vect_gather_slp_loads (vec_info *);
    2595                 :             : extern void vect_get_slp_defs (slp_tree, vec<tree> *);
    2596                 :             : extern void vect_get_slp_defs (vec_info *, slp_tree, vec<vec<tree> > *,
    2597                 :             :                                unsigned n = -1U);
    2598                 :             : extern bool vect_slp_if_converted_bb (basic_block bb, loop_p orig_loop);
    2599                 :             : extern bool vect_slp_function (function *);
    2600                 :             : extern stmt_vec_info vect_find_last_scalar_stmt_in_slp (slp_tree);
    2601                 :             : extern stmt_vec_info vect_find_first_scalar_stmt_in_slp (slp_tree);
    2602                 :             : extern bool is_simple_and_all_uses_invariant (stmt_vec_info, loop_vec_info);
    2603                 :             : extern bool can_duplicate_and_interleave_p (vec_info *, unsigned int, tree,
    2604                 :             :                                             unsigned int * = NULL,
    2605                 :             :                                             tree * = NULL, tree * = NULL);
    2606                 :             : extern void duplicate_and_interleave (vec_info *, gimple_seq *, tree,
    2607                 :             :                                       const vec<tree> &, unsigned int, vec<tree> &);
    2608                 :             : extern int vect_get_place_in_interleaving_chain (stmt_vec_info, stmt_vec_info);
    2609                 :             : extern slp_tree vect_create_new_slp_node (unsigned, tree_code);
    2610                 :             : extern void vect_free_slp_tree (slp_tree);
    2611                 :             : extern bool compatible_calls_p (gcall *, gcall *);
    2612                 :             : extern int vect_slp_child_index_for_operand (const gimple *, int op, bool);
    2613                 :             : 
    2614                 :             : extern tree prepare_vec_mask (loop_vec_info, tree, tree, tree,
    2615                 :             :                               gimple_stmt_iterator *);
    2616                 :             : extern tree vect_get_mask_load_else (int, tree);
    2617                 :             : 
    2618                 :             : /* In tree-vect-patterns.cc.  */
    2619                 :             : extern void
    2620                 :             : vect_mark_pattern_stmts (vec_info *, stmt_vec_info, gimple *, tree);
    2621                 :             : extern bool vect_get_range_info (tree, wide_int*, wide_int*);
    2622                 :             : 
    2623                 :             : /* Pattern recognition functions.
    2624                 :             :    Additional pattern recognition functions can (and will) be added
    2625                 :             :    in the future.  */
    2626                 :             : void vect_pattern_recog (vec_info *);
    2627                 :             : 
    2628                 :             : /* In tree-vectorizer.cc.  */
    2629                 :             : unsigned vectorize_loops (void);
    2630                 :             : void vect_free_loop_info_assumptions (class loop *);
    2631                 :             : gimple *vect_loop_vectorized_call (class loop *, gcond **cond = NULL);
    2632                 :             : bool vect_stmt_dominates_stmt_p (gimple *, gimple *);
    2633                 :             : 
    2634                 :             : /* SLP Pattern matcher types, tree-vect-slp-patterns.cc.  */
    2635                 :             : 
    2636                 :             : /* Forward declaration of possible two operands operation that can be matched
    2637                 :             :    by the complex numbers pattern matchers.  */
    2638                 :             : enum _complex_operation : unsigned;
    2639                 :             : 
    2640                 :             : /* Load permute kinds that the partial data-flow analysis can produce.  Used
    2641                 :             :    as the value type of slp_tree_to_load_perm_map_t.  */
    2642                 :             : typedef enum _complex_perm_kinds {
    2643                 :             :    PERM_UNKNOWN,  /* First enumerator, hence value 0.  */
    2644                 :             :    PERM_EVENODD,
    2645                 :             :    PERM_ODDEVEN,
    2646                 :             :    PERM_ODDODD,
    2647                 :             :    PERM_EVENEVEN,
    2648                 :             :    /* Can be combined with any other PERM values.  */
    2649                 :             :    PERM_TOP
    2650                 :             : } complex_perm_kinds_t;
    2651                 :             : 
    2652                 :             : /* Cache from nodes to the load permutation they represent.  */
    2653                 :             : typedef hash_map <slp_tree, complex_perm_kinds_t>
    2654                 :             :   slp_tree_to_load_perm_map_t;
    2655                 :             : 
    2656                 :             : /* Cache from nodes pair to being compatible or not.  */
    2657                 :             : typedef pair_hash <nofree_ptr_hash <_slp_tree>,
    2658                 :             :                    nofree_ptr_hash <_slp_tree>> slp_node_hash;
    2659                 :             : typedef hash_map <slp_node_hash, bool> slp_compat_nodes_map_t;
    2660                 :             : 
    2661                 :             : 
    2662                 :             : /* Abstract base class for vector pattern matchers (build is pure virtual).
    2663                 :             :    All SLP pattern matchers must inherit from this type.  */
    2664                 :             : 
    2665                 :             : class vect_pattern
    2666                 :             : {
    2667                 :             :   protected:
    2668                 :             :     /* Number of arguments the IFN requires; the constructor leaves it unset.  */
    2669                 :             :     unsigned m_num_args;
    2670                 :             : 
    2671                 :             :     /* The internal function that will be used when a pattern is created.  */
    2672                 :             :     internal_fn m_ifn;
    2673                 :             : 
    2674                 :             :     /* The current node being inspected (the constructor's NODE argument).  */
    2675                 :             :     slp_tree *m_node;
    2676                 :             : 
    2677                 :             :     /* The list of operands to be the children for the node produced when the
    2678                 :             :        internal function is created.  Released by the destructor.  */
    2679                 :             :     vec<slp_tree> m_ops;
    2680                 :             : 
    2681                 :             :     /* Protected constructor: record IFN and NODE, append *M_OPS if nonnull.  */
    2682                 :         448 :     vect_pattern (slp_tree *node, vec<slp_tree> *m_ops, internal_fn ifn)
    2683                 :         448 :     {
    2684                 :         448 :       this->m_ifn = ifn;
    2685                 :         448 :       this->m_node = node;
    2686                 :         448 :       this->m_ops.create (0);
    2687                 :         448 :       if (m_ops)  /* The parameter, which shadows the member.  */
    2688                 :          20 :         this->m_ops.safe_splice (*m_ops);
    2689                 :             :     }
    2690                 :             : 
    2691                 :             :   public:
    2692                 :             : 
    2693                 :             :     /* Create a new instance of the pattern matcher class of the given type.  */
    2694                 :             :     static vect_pattern* recognize (slp_tree_to_load_perm_map_t *,
    2695                 :             :                                     slp_compat_nodes_map_t *, slp_tree *);
    2696                 :             : 
    2697                 :             :     /* Build the pattern from the data collected so far.  */
    2698                 :             :     virtual void build (vec_info *) = 0;
    2699                 :             : 
    2700                 :             :     /* Destructor; releases the storage held by m_ops.  */
    2701                 :             :     virtual ~vect_pattern ()
    2702                 :             :     {
    2703                 :             :         this->m_ops.release ();
    2704                 :             :     }
    2705                 :             : };
    2706                 :             : 
    2707                 :             : /* Function pointer to create a new pattern matcher from a generic type.  */
    2708                 :             : typedef vect_pattern* (*vect_pattern_decl_t) (slp_tree_to_load_perm_map_t *,
    2709                 :             :                                               slp_compat_nodes_map_t *,
    2710                 :             :                                               slp_tree *);
    2711                 :             : 
    2712                 :             : /* List of supported pattern matchers.  */
    2713                 :             : extern vect_pattern_decl_t slp_patterns[];
    2714                 :             : 
    2715                 :             : /* Number of supported pattern matchers.  */
    2716                 :             : extern size_t num__slp_patterns;
    2717                 :             : 
    2718                 :             : /* ----------------------------------------------------------------------
    2719                 :             :    Target support routines
    2720                 :             :    -----------------------------------------------------------------------
    2721                 :             :    The following routines are provided to simplify costing decisions in
    2722                 :             :    target code.  Please add more as needed.  */
    2723                 :             : 
    2724                 :             : /* Return true if an operation of kind KIND for STMT_INFO extracts an
    2725                 :             :    element from a vector so that the element can then be stored to
    2726                 :             :    memory.  STMT_INFO is only inspected when KIND is vec_to_scalar.  */
    2727                 :             : inline bool
    2728                 :             : vect_is_store_elt_extraction (vect_cost_for_stmt kind, stmt_vec_info stmt_info)
    2729                 :             : {
    2730                 :             :   data_reference_p dr
    2731                 :             :     = (kind == vec_to_scalar ? STMT_VINFO_DATA_REF (stmt_info) : nullptr);
    2732                 :             :   return dr && DR_IS_WRITE (dr);
    2733                 :             : }
    2734                 :             : 
    2735                 :             : /* Return true if STMT_INFO is part of a reduction (nonnegative REDUC_IDX).  */
    2736                 :             : inline bool
    2737                 :             : vect_is_reduction (stmt_vec_info stmt_info)
    2738                 :             : {
    2739                 :             :   return !(STMT_VINFO_REDUC_IDX (stmt_info) < 0);
    2740                 :             : }
    2741                 :             : 
    2742                 :             : /* Return the memory access type used to vectorize the statement: the one
    2743                 :             :    recorded on NODE when an SLP node is given, else the one on STMT_INFO.  */
    2744                 :             : 
    2745                 :             : inline vect_memory_access_type
    2746                 :             : vect_mem_access_type (stmt_vec_info stmt_info, slp_tree node)
    2747                 :             : {
    2748                 :             :   /* NODE, when nonnull, takes precedence over STMT_INFO.  */
    2749                 :             :   return (node
    2750                 :             :           ? SLP_TREE_MEMORY_ACCESS_TYPE (node)
    2751                 :             :           : STMT_VINFO_MEMORY_ACCESS_TYPE (stmt_info));
    2752                 :             : }
    2753                 :             : 
    2754                 :             : /* Return, as an int, the vect_reduction_type of the reduction STMT_INFO is
    2755                 :             :    part of; return -1 if VINFO is not for a loop or there is no reduction.  */
    2756                 :             : inline int
    2757                 :             : vect_reduc_type (vec_info *vinfo, stmt_vec_info stmt_info)
    2758                 :             : {
    2759                 :             :   loop_vec_info loop_info = dyn_cast<loop_vec_info> (vinfo);
    2760                 :             :   if (!loop_info || !STMT_VINFO_REDUC_DEF (stmt_info))
    2761                 :             :     return -1;
    2762                 :             : 
    2763                 :             :   /* The type is read from the statement info_for_reduction returns.  */
    2764                 :             :   stmt_vec_info reduc_stmt = info_for_reduction (loop_info, stmt_info);
    2765                 :             :   return int (STMT_VINFO_REDUC_TYPE (reduc_stmt));
    2766                 :             : }
    2767                 :             : 
    2768                 :             : /* If STMT_INFO is a COND_EXPR assignment whose condition is itself a
    2769                 :             :    comparison, return the type of the comparison's first operand, else null.  */
    2770                 :             : inline tree
    2771                 :             : vect_embedded_comparison_type (stmt_vec_info stmt_info)
    2772                 :             : {
    2773                 :             :   gassign *select = dyn_cast<gassign *> (stmt_info->stmt);
    2774                 :             :   if (!select || gimple_assign_rhs_code (select) != COND_EXPR)
    2775                 :             :     return NULL_TREE;
    2776                 :             : 
    2777                 :             :   tree pred = gimple_assign_rhs1 (select);
    2778                 :             :   if (!COMPARISON_CLASS_P (pred))
    2779                 :             :     return NULL_TREE;
    2780                 :             :   return TREE_TYPE (TREE_OPERAND (pred, 0));
    2781                 :             : }
    2782                 :             : 
    2783                 :             : /* If STMT_INFO is a comparison, return the type of its first operand;
    2784                 :             :    otherwise defer to vect_embedded_comparison_type, which may return null.  */
    2785                 :             : inline tree
    2786                 :             : vect_comparison_type (stmt_vec_info stmt_info)
    2787                 :             : {
    2788                 :             :   gassign *asg = dyn_cast<gassign *> (stmt_info->stmt);
    2789                 :             :   if (asg && TREE_CODE_CLASS (gimple_assign_rhs_code (asg)) == tcc_comparison)
    2790                 :             :     return TREE_TYPE (gimple_assign_rhs1 (asg));
    2791                 :             :   return vect_embedded_comparison_type (stmt_info);
    2792                 :             : }
    2793                 :             : 
    2794                 :             : /* Return true if STMT_INFO widens, as an integer, the result of a load.  */
    2795                 :             : inline bool
    2796                 :             : vect_is_extending_load (class vec_info *vinfo, stmt_vec_info stmt_info)
    2797                 :             : {
    2798                 :             :   /* Kept inline despite its size.  Only conversion assignments qualify;
    2799                 :             :      all operands are read through ASSIGN, the checked form of the stmt.  */
    2800                 :             :   gassign *assign = dyn_cast <gassign *> (stmt_info->stmt);
    2801                 :             :   if (!assign || !CONVERT_EXPR_CODE_P (gimple_assign_rhs_code (assign)))
    2802                 :             :     return false;
    2803                 :             : 
    2804                 :             :   tree rhs = gimple_assign_rhs1 (assign);
    2805                 :             :   tree lhs_type = TREE_TYPE (gimple_assign_lhs (assign));
    2806                 :             :   tree rhs_type = TREE_TYPE (rhs);
    2807                 :             :   if (!INTEGRAL_TYPE_P (lhs_type)
    2808                 :             :       || !INTEGRAL_TYPE_P (rhs_type)
    2809                 :             :       || TYPE_PRECISION (lhs_type) <= TYPE_PRECISION (rhs_type))
    2810                 :             :     return false;
    2811                 :             : 
    2812                 :             :   stmt_vec_info def_stmt_info = vinfo->lookup_def (rhs);
    2813                 :             :   return (def_stmt_info
    2814                 :             :           && STMT_VINFO_DATA_REF (def_stmt_info)
    2815                 :             :           && DR_IS_READ (STMT_VINFO_DATA_REF (def_stmt_info)));
    2816                 :             : }
    2817                 :             : 
    2818                 :             : /* Return true if STMT_INFO is an integer truncation, i.e. an assignment whose code satisfies CONVERT_EXPR_CODE_P and whose integral result type has strictly less precision than its integral operand type.  */
    2819                 :             : inline bool
    2820                 :             : vect_is_integer_truncation (stmt_vec_info stmt_info)
    2821                 :             : {
    2822                 :             :   gassign *assign = dyn_cast <gassign *> (stmt_info->stmt);
    2823                 :             :   if (!assign || !CONVERT_EXPR_CODE_P (gimple_assign_rhs_code (assign)))
    2824                 :             :     return false;
    2825                 :             :   /* Both types must be integral, and the result must be strictly narrower than the operand.  */
    2826                 :             :   tree lhs_type = TREE_TYPE (gimple_assign_lhs (assign));
    2827                 :             :   tree rhs_type = TREE_TYPE (gimple_assign_rhs1 (assign));
    2828                 :             :   return (INTEGRAL_TYPE_P (lhs_type)
    2829                 :             :           && INTEGRAL_TYPE_P (rhs_type)
    2830                 :             :           && TYPE_PRECISION (lhs_type) < TYPE_PRECISION (rhs_type));
    2831                 :             : }
    2832                 :             : 
    2833                 :             : /* Build a GIMPLE_ASSIGN or GIMPLE_CALL, depending on whether the code_helper argument (CH) contains a tree_code
    2834                 :             :    or an internal_fn, respectively.  The last tree argument defaults to NULL_TREE.  NOTE(review): the tree arguments are presumably the result and the operands; confirm against the definition.  */
    2835                 :             : gimple * vect_gimple_build (tree, code_helper, tree, tree = NULL_TREE);
    2836                 :             : #endif  /* GCC_TREE_VECTORIZER_H  */
        

Generated by: LCOV version 2.1-beta

The LCOV profile is generated on an x86_64 machine using the following configure options: configure --disable-bootstrap --enable-coverage=opt --enable-languages=c,c++,fortran,go,jit,lto,rust,m2 --enable-host-shared. The GCC test suite is run with the built compiler.