dist/gcc/vector-builder.h

cef8759bSmrg/* A class for building vector constant patterns.
*4c3eb207Smrg   Copyright (C) 2017-2020 Free Software Foundation, Inc.
cef8759bSmrg
cef8759bSmrgThis file is part of GCC.
cef8759bSmrg
cef8759bSmrgGCC is free software; you can redistribute it and/or modify it under
cef8759bSmrgthe terms of the GNU General Public License as published by the Free
cef8759bSmrgSoftware Foundation; either version 3, or (at your option) any later
cef8759bSmrgversion.
cef8759bSmrg
cef8759bSmrgGCC is distributed in the hope that it will be useful, but WITHOUT ANY
cef8759bSmrgWARRANTY; without even the implied warranty of MERCHANTABILITY or
cef8759bSmrgFITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
cef8759bSmrgfor more details.
cef8759bSmrg
cef8759bSmrgYou should have received a copy of the GNU General Public License
cef8759bSmrgalong with GCC; see the file COPYING3.  If not see
cef8759bSmrg<http://www.gnu.org/licenses/>.  */
cef8759bSmrg
cef8759bSmrg#ifndef GCC_VECTOR_BUILDER_H
cef8759bSmrg#define GCC_VECTOR_BUILDER_H
cef8759bSmrg
cef8759bSmrg/* This class is a wrapper around auto_vec<T> for building vectors of T.
cef8759bSmrg   It aims to encode each vector as npatterns interleaved patterns,
cef8759bSmrg   where each pattern represents a sequence:
cef8759bSmrg
cef8759bSmrg     { BASE0, BASE1, BASE1 + STEP, BASE1 + STEP*2, BASE1 + STEP*3, ... }
cef8759bSmrg
cef8759bSmrg   The first three elements in each pattern provide enough information
cef8759bSmrg   to derive the other elements.  If all patterns have a STEP of zero,
cef8759bSmrg   we only need to encode the first two elements in each pattern.
cef8759bSmrg   If BASE1 is also equal to BASE0 for all patterns, we only need to
cef8759bSmrg   encode the first element in each pattern.  The number of encoded
cef8759bSmrg   elements per pattern is given by nelts_per_pattern.
cef8759bSmrg
cef8759bSmrg   The class can be used in two ways:
cef8759bSmrg
cef8759bSmrg   1. It can be used to build a full image of the vector, which is then
cef8759bSmrg      canonicalized by finalize ().  In this case npatterns is initially
cef8759bSmrg      the number of elements in the vector and nelts_per_pattern is
cef8759bSmrg      initially 1.
cef8759bSmrg
cef8759bSmrg   2. It can be used to build a vector that already has a known encoding.
cef8759bSmrg      This is preferred since it is more efficient and copes with
cef8759bSmrg      variable-length vectors.  finalize () then canonicalizes the encoding
cef8759bSmrg      to a simpler form if possible.
cef8759bSmrg
*4c3eb207Smrg   Shape is the type that specifies the number of elements in the vector
*4c3eb207Smrg   and (where relevant) the type of each element.
*4c3eb207Smrg
*4c3eb207Smrg   The derived class Derived provides the functionality of this class
*4c3eb207Smrg   for specific Ts.  Derived needs to provide the following interface:
cef8759bSmrg
cef8759bSmrg      bool equal_p (T elt1, T elt2) const;
cef8759bSmrg
cef8759bSmrg	  Return true if elements ELT1 and ELT2 are equal.
cef8759bSmrg
cef8759bSmrg      bool allow_steps_p () const;
cef8759bSmrg
cef8759bSmrg	  Return true if a stepped representation is OK.  We don't allow
cef8759bSmrg	  linear series for anything other than integers, to avoid problems
cef8759bSmrg	  with rounding.
cef8759bSmrg
cef8759bSmrg      bool integral_p (T elt) const;
cef8759bSmrg
cef8759bSmrg	  Return true if element ELT can be interpreted as an integer.
cef8759bSmrg
cef8759bSmrg      StepType step (T elt1, T elt2) const;
cef8759bSmrg
cef8759bSmrg	  Return the value of element ELT2 minus the value of element ELT1,
cef8759bSmrg	  given integral_p (ELT1) && integral_p (ELT2).  There is no fixed
cef8759bSmrg	  choice of StepType.
cef8759bSmrg
cef8759bSmrg      T apply_step (T base, unsigned int factor, StepType step) const;
cef8759bSmrg
cef8759bSmrg	  Return a vector element with the value BASE + FACTOR * STEP.
cef8759bSmrg
cef8759bSmrg      bool can_elide_p (T elt) const;
cef8759bSmrg
cef8759bSmrg	  Return true if we can drop element ELT, even if the retained
cef8759bSmrg	  elements are different.  This is provided for TREE_OVERFLOW
cef8759bSmrg	  handling.
cef8759bSmrg
cef8759bSmrg      void note_representative (T *elt1_ptr, T elt2);
cef8759bSmrg
cef8759bSmrg	  Record that ELT2 is being elided, given that ELT1_PTR points to
cef8759bSmrg	  the last encoded element for the containing pattern.  This is
*4c3eb207Smrg	  again provided for TREE_OVERFLOW handling.
cef8759bSmrg
*4c3eb207Smrg      static poly_uint64 shape_nelts (Shape shape);
*4c3eb207Smrg
*4c3eb207Smrg	  Return the number of elements in SHAPE.
*4c3eb207Smrg
*4c3eb207Smrg    The class provides additional functionality for the case in which
*4c3eb207Smrg    T can describe a vector constant as well as an individual element.
*4c3eb207Smrg    This functionality requires:
*4c3eb207Smrg
*4c3eb207Smrg      static poly_uint64 nelts_of (T x);
*4c3eb207Smrg
*4c3eb207Smrg	  Return the number of elements in vector constant X.
*4c3eb207Smrg
*4c3eb207Smrg      static unsigned int npatterns_of (T x);
*4c3eb207Smrg
*4c3eb207Smrg	  Return the number of patterns used to encode vector constant X.
*4c3eb207Smrg
*4c3eb207Smrg      static unsigned int nelts_per_pattern_of (T x);
*4c3eb207Smrg
*4c3eb207Smrg	  Return the number of elements used to encode each pattern
*4c3eb207Smrg	  in vector constant X.  */
*4c3eb207Smrg
*4c3eb207Smrgtemplate<typename T, typename Shape, typename Derived>
cef8759bSmrgclass vector_builder : public auto_vec<T, 32>
cef8759bSmrg{
cef8759bSmrgpublic:
cef8759bSmrg  vector_builder ();
cef8759bSmrg
cef8759bSmrg  poly_uint64 full_nelts () const { return m_full_nelts; }
cef8759bSmrg  unsigned int npatterns () const { return m_npatterns; }
cef8759bSmrg  unsigned int nelts_per_pattern () const { return m_nelts_per_pattern; }
cef8759bSmrg  unsigned int encoded_nelts () const;
cef8759bSmrg  bool encoded_full_vector_p () const;
cef8759bSmrg  T elt (unsigned int) const;
*4c3eb207Smrg  unsigned int count_dups (int, int, int) const;
cef8759bSmrg
cef8759bSmrg  bool operator == (const Derived &) const;
cef8759bSmrg  bool operator != (const Derived &x) const { return !operator == (x); }
cef8759bSmrg
*4c3eb207Smrg  bool new_unary_operation (Shape, T, bool);
*4c3eb207Smrg  bool new_binary_operation (Shape, T, T, bool);
*4c3eb207Smrg
cef8759bSmrg  void finalize ();
cef8759bSmrg
*4c3eb207Smrg  static unsigned int binary_encoded_nelts (T, T);
*4c3eb207Smrg
cef8759bSmrgprotected:
cef8759bSmrg  void new_vector (poly_uint64, unsigned int, unsigned int);
cef8759bSmrg  void reshape (unsigned int, unsigned int);
cef8759bSmrg  bool repeating_sequence_p (unsigned int, unsigned int, unsigned int);
cef8759bSmrg  bool stepped_sequence_p (unsigned int, unsigned int, unsigned int);
cef8759bSmrg  bool try_npatterns (unsigned int);
cef8759bSmrg
cef8759bSmrgprivate:
cef8759bSmrg  vector_builder (const vector_builder &);
cef8759bSmrg  vector_builder &operator= (const vector_builder &);
cef8759bSmrg  Derived *derived () { return static_cast<Derived *> (this); }
cef8759bSmrg  const Derived *derived () const;
cef8759bSmrg
cef8759bSmrg  poly_uint64 m_full_nelts;
cef8759bSmrg  unsigned int m_npatterns;
cef8759bSmrg  unsigned int m_nelts_per_pattern;
cef8759bSmrg};
cef8759bSmrg
*4c3eb207Smrgtemplate<typename T, typename Shape, typename Derived>
cef8759bSmrginline const Derived *
*4c3eb207Smrgvector_builder<T, Shape, Derived>::derived () const
cef8759bSmrg{
cef8759bSmrg  return static_cast<const Derived *> (this);
cef8759bSmrg}
cef8759bSmrg
*4c3eb207Smrgtemplate<typename T, typename Shape, typename Derived>
cef8759bSmrginline
*4c3eb207Smrgvector_builder<T, Shape, Derived>::vector_builder ()
cef8759bSmrg  : m_full_nelts (0),
cef8759bSmrg    m_npatterns (0),
cef8759bSmrg    m_nelts_per_pattern (0)
cef8759bSmrg{}
cef8759bSmrg
cef8759bSmrg/* Return the number of elements that are explicitly encoded.  The vec
cef8759bSmrg   starts with these explicitly-encoded elements and may contain additional
cef8759bSmrg   elided elements.  */
cef8759bSmrg
*4c3eb207Smrgtemplate<typename T, typename Shape, typename Derived>
cef8759bSmrginline unsigned int
*4c3eb207Smrgvector_builder<T, Shape, Derived>::encoded_nelts () const
cef8759bSmrg{
cef8759bSmrg  return m_npatterns * m_nelts_per_pattern;
cef8759bSmrg}
cef8759bSmrg
cef8759bSmrg/* Return true if every element of the vector is explicitly encoded.  */
cef8759bSmrg
*4c3eb207Smrgtemplate<typename T, typename Shape, typename Derived>
cef8759bSmrginline bool
*4c3eb207Smrgvector_builder<T, Shape, Derived>::encoded_full_vector_p () const
cef8759bSmrg{
cef8759bSmrg  return known_eq (m_npatterns * m_nelts_per_pattern, m_full_nelts);
cef8759bSmrg}
cef8759bSmrg
cef8759bSmrg/* Start building a vector that has FULL_NELTS elements.  Initially
cef8759bSmrg   encode it using NPATTERNS patterns with NELTS_PER_PATTERN each.  */
cef8759bSmrg
*4c3eb207Smrgtemplate<typename T, typename Shape, typename Derived>
cef8759bSmrgvoid
*4c3eb207Smrgvector_builder<T, Shape, Derived>::new_vector (poly_uint64 full_nelts,
cef8759bSmrg					       unsigned int npatterns,
cef8759bSmrg					       unsigned int nelts_per_pattern)
cef8759bSmrg{
cef8759bSmrg  m_full_nelts = full_nelts;
cef8759bSmrg  m_npatterns = npatterns;
cef8759bSmrg  m_nelts_per_pattern = nelts_per_pattern;
cef8759bSmrg  this->reserve (encoded_nelts ());
cef8759bSmrg  this->truncate (0);
cef8759bSmrg}
cef8759bSmrg
cef8759bSmrg/* Return true if this vector and OTHER have the same elements and
cef8759bSmrg   are encoded in the same way.  */
cef8759bSmrg
*4c3eb207Smrgtemplate<typename T, typename Shape, typename Derived>
cef8759bSmrgbool
*4c3eb207Smrgvector_builder<T, Shape, Derived>::operator == (const Derived &other) const
cef8759bSmrg{
cef8759bSmrg  if (maybe_ne (m_full_nelts, other.m_full_nelts)
cef8759bSmrg      || m_npatterns != other.m_npatterns
cef8759bSmrg      || m_nelts_per_pattern != other.m_nelts_per_pattern)
cef8759bSmrg    return false;
cef8759bSmrg
cef8759bSmrg  unsigned int nelts = encoded_nelts ();
cef8759bSmrg  for (unsigned int i = 0; i < nelts; ++i)
cef8759bSmrg    if (!derived ()->equal_p ((*this)[i], other[i]))
cef8759bSmrg      return false;
cef8759bSmrg
cef8759bSmrg  return true;
cef8759bSmrg}
cef8759bSmrg
cef8759bSmrg/* Return the value of vector element I, which might or might not be
cef8759bSmrg   encoded explicitly.  */
cef8759bSmrg
*4c3eb207Smrgtemplate<typename T, typename Shape, typename Derived>
cef8759bSmrgT
*4c3eb207Smrgvector_builder<T, Shape, Derived>::elt (unsigned int i) const
cef8759bSmrg{
cef8759bSmrg  /* First handle elements that are already present in the underlying
cef8759bSmrg     vector, regardless of whether they're part of the encoding or not.  */
cef8759bSmrg  if (i < this->length ())
cef8759bSmrg    return (*this)[i];
cef8759bSmrg
*4c3eb207Smrg  /* Extrapolation is only possible if the encoding has been fully
*4c3eb207Smrg     populated.  */
*4c3eb207Smrg  gcc_checking_assert (encoded_nelts () <= this->length ());
*4c3eb207Smrg
cef8759bSmrg  /* Identify the pattern that contains element I and work out the index of
cef8759bSmrg     the last encoded element for that pattern.  */
cef8759bSmrg  unsigned int pattern = i % m_npatterns;
cef8759bSmrg  unsigned int count = i / m_npatterns;
cef8759bSmrg  unsigned int final_i = encoded_nelts () - m_npatterns + pattern;
cef8759bSmrg  T final = (*this)[final_i];
cef8759bSmrg
cef8759bSmrg  /* If there are no steps, the final encoded value is the right one.  */
cef8759bSmrg  if (m_nelts_per_pattern <= 2)
cef8759bSmrg    return final;
cef8759bSmrg
cef8759bSmrg  /* Otherwise work out the value from the last two encoded elements.  */
cef8759bSmrg  T prev = (*this)[final_i - m_npatterns];
cef8759bSmrg  return derived ()->apply_step (final, count - 2,
cef8759bSmrg				 derived ()->step (prev, final));
cef8759bSmrg}
cef8759bSmrg
*4c3eb207Smrg/* Try to start building a new vector of shape SHAPE that holds the result of
*4c3eb207Smrg   a unary operation on vector constant VEC.  ALLOW_STEPPED_P is true if the
*4c3eb207Smrg   operation can handle stepped encodings directly, without having to expand
*4c3eb207Smrg   the full sequence.
*4c3eb207Smrg
*4c3eb207Smrg   Return true if the operation is possible, which it always is when
*4c3eb207Smrg   ALLOW_STEPPED_P is true.  Leave the builder unchanged otherwise.  */
*4c3eb207Smrg
*4c3eb207Smrgtemplate<typename T, typename Shape, typename Derived>
*4c3eb207Smrgbool
*4c3eb207Smrgvector_builder<T, Shape, Derived>::new_unary_operation (Shape shape, T vec,
*4c3eb207Smrg							bool allow_stepped_p)
*4c3eb207Smrg{
*4c3eb207Smrg  poly_uint64 full_nelts = Derived::shape_nelts (shape);
*4c3eb207Smrg  gcc_assert (known_eq (full_nelts, Derived::nelts_of (vec)));
*4c3eb207Smrg  unsigned int npatterns = Derived::npatterns_of (vec);
*4c3eb207Smrg  unsigned int nelts_per_pattern = Derived::nelts_per_pattern_of (vec);
*4c3eb207Smrg  if (!allow_stepped_p && nelts_per_pattern > 2)
*4c3eb207Smrg    {
*4c3eb207Smrg      if (!full_nelts.is_constant ())
*4c3eb207Smrg	return false;
*4c3eb207Smrg      npatterns = full_nelts.to_constant ();
*4c3eb207Smrg      nelts_per_pattern = 1;
*4c3eb207Smrg    }
*4c3eb207Smrg  derived ()->new_vector (shape, npatterns, nelts_per_pattern);
*4c3eb207Smrg  return true;
*4c3eb207Smrg}
*4c3eb207Smrg
*4c3eb207Smrg/* Try to start building a new vector of shape SHAPE that holds the result of
*4c3eb207Smrg   a binary operation on vector constants VEC1 and VEC2.  ALLOW_STEPPED_P is
*4c3eb207Smrg   true if the operation can handle stepped encodings directly, without
*4c3eb207Smrg   having to expand the full sequence.
*4c3eb207Smrg
*4c3eb207Smrg   Return true if the operation is possible.  Leave the builder unchanged
*4c3eb207Smrg   otherwise.  */
*4c3eb207Smrg
*4c3eb207Smrgtemplate<typename T, typename Shape, typename Derived>
*4c3eb207Smrgbool
*4c3eb207Smrgvector_builder<T, Shape, Derived>::new_binary_operation (Shape shape,
*4c3eb207Smrg							 T vec1, T vec2,
*4c3eb207Smrg							 bool allow_stepped_p)
*4c3eb207Smrg{
*4c3eb207Smrg  poly_uint64 full_nelts = Derived::shape_nelts (shape);
*4c3eb207Smrg  gcc_assert (known_eq (full_nelts, Derived::nelts_of (vec1))
*4c3eb207Smrg	      && known_eq (full_nelts, Derived::nelts_of (vec2)));
*4c3eb207Smrg  /* Conceptually we split the patterns in VEC1 and VEC2 until we have
*4c3eb207Smrg     an equal number for both.  Each split pattern requires the same
*4c3eb207Smrg     number of elements per pattern as the original.  E.g. splitting:
*4c3eb207Smrg
*4c3eb207Smrg       { 1, 2, 3, ... }
*4c3eb207Smrg
*4c3eb207Smrg     into two gives:
*4c3eb207Smrg
*4c3eb207Smrg       { 1, 3, 5, ... }
*4c3eb207Smrg       { 2, 4, 6, ... }
*4c3eb207Smrg
*4c3eb207Smrg     while splitting:
*4c3eb207Smrg
*4c3eb207Smrg       { 1, 0, ... }
*4c3eb207Smrg
*4c3eb207Smrg     into two gives:
*4c3eb207Smrg
*4c3eb207Smrg       { 1, 0, ... }
*4c3eb207Smrg       { 0, 0, ... }.  */
*4c3eb207Smrg  unsigned int npatterns
*4c3eb207Smrg    = least_common_multiple (Derived::npatterns_of (vec1),
*4c3eb207Smrg			     Derived::npatterns_of (vec2));
*4c3eb207Smrg  unsigned int nelts_per_pattern
*4c3eb207Smrg    = MAX (Derived::nelts_per_pattern_of (vec1),
*4c3eb207Smrg	   Derived::nelts_per_pattern_of (vec2));
*4c3eb207Smrg  if (!allow_stepped_p && nelts_per_pattern > 2)
*4c3eb207Smrg    {
*4c3eb207Smrg      if (!full_nelts.is_constant ())
*4c3eb207Smrg	return false;
*4c3eb207Smrg      npatterns = full_nelts.to_constant ();
*4c3eb207Smrg      nelts_per_pattern = 1;
*4c3eb207Smrg    }
*4c3eb207Smrg  derived ()->new_vector (shape, npatterns, nelts_per_pattern);
*4c3eb207Smrg  return true;
*4c3eb207Smrg}
*4c3eb207Smrg
*4c3eb207Smrg/* Return the number of elements that the caller needs to operate on in
*4c3eb207Smrg   order to handle a binary operation on vector constants VEC1 and VEC2.
*4c3eb207Smrg   This static function is used instead of new_binary_operation if the
*4c3eb207Smrg   result of the operation is not a constant vector.  */
*4c3eb207Smrg
*4c3eb207Smrgtemplate<typename T, typename Shape, typename Derived>
*4c3eb207Smrgunsigned int
*4c3eb207Smrgvector_builder<T, Shape, Derived>::binary_encoded_nelts (T vec1, T vec2)
*4c3eb207Smrg{
*4c3eb207Smrg  poly_uint64 nelts = Derived::nelts_of (vec1);
*4c3eb207Smrg  gcc_assert (known_eq (nelts, Derived::nelts_of (vec2)));
*4c3eb207Smrg  /* See new_binary_operation for details.  */
*4c3eb207Smrg  unsigned int npatterns
*4c3eb207Smrg    = least_common_multiple (Derived::npatterns_of (vec1),
*4c3eb207Smrg			     Derived::npatterns_of (vec2));
*4c3eb207Smrg  unsigned int nelts_per_pattern
*4c3eb207Smrg    = MAX (Derived::nelts_per_pattern_of (vec1),
*4c3eb207Smrg	   Derived::nelts_per_pattern_of (vec2));
*4c3eb207Smrg  unsigned HOST_WIDE_INT const_nelts;
*4c3eb207Smrg  if (nelts.is_constant (&const_nelts))
*4c3eb207Smrg    return MIN (npatterns * nelts_per_pattern, const_nelts);
*4c3eb207Smrg  return npatterns * nelts_per_pattern;
*4c3eb207Smrg}
*4c3eb207Smrg
*4c3eb207Smrg/* Return the number of leading duplicate elements in the range
*4c3eb207Smrg   [START:END:STEP].  The value is always at least 1.  */
*4c3eb207Smrg
*4c3eb207Smrgtemplate<typename T, typename Shape, typename Derived>
*4c3eb207Smrgunsigned int
*4c3eb207Smrgvector_builder<T, Shape, Derived>::count_dups (int start, int end,
*4c3eb207Smrg					       int step) const
*4c3eb207Smrg{
*4c3eb207Smrg  gcc_assert ((end - start) % step == 0);
*4c3eb207Smrg
*4c3eb207Smrg  unsigned int ndups = 1;
*4c3eb207Smrg  for (int i = start + step;
*4c3eb207Smrg       i != end && derived ()->equal_p (elt (i), elt (start));
*4c3eb207Smrg       i += step)
*4c3eb207Smrg    ndups++;
*4c3eb207Smrg  return ndups;
*4c3eb207Smrg}
*4c3eb207Smrg
cef8759bSmrg/* Change the encoding to NPATTERNS patterns of NELTS_PER_PATTERN each,
cef8759bSmrg   but without changing the underlying vector.  */
cef8759bSmrg
*4c3eb207Smrgtemplate<typename T, typename Shape, typename Derived>
cef8759bSmrgvoid
*4c3eb207Smrgvector_builder<T, Shape, Derived>::reshape (unsigned int npatterns,
cef8759bSmrg					    unsigned int nelts_per_pattern)
cef8759bSmrg{
cef8759bSmrg  unsigned int old_encoded_nelts = encoded_nelts ();
cef8759bSmrg  unsigned int new_encoded_nelts = npatterns * nelts_per_pattern;
cef8759bSmrg  gcc_checking_assert (new_encoded_nelts <= old_encoded_nelts);
cef8759bSmrg  unsigned int next = new_encoded_nelts - npatterns;
cef8759bSmrg  for (unsigned int i = new_encoded_nelts; i < old_encoded_nelts; ++i)
cef8759bSmrg    {
cef8759bSmrg      derived ()->note_representative (&(*this)[next], (*this)[i]);
cef8759bSmrg      next += 1;
cef8759bSmrg      if (next == new_encoded_nelts)
cef8759bSmrg	next -= npatterns;
cef8759bSmrg    }
cef8759bSmrg  m_npatterns = npatterns;
cef8759bSmrg  m_nelts_per_pattern = nelts_per_pattern;
cef8759bSmrg}
cef8759bSmrg
cef8759bSmrg/* Return true if elements [START, END) contain a repeating sequence of
cef8759bSmrg   STEP elements.  */
cef8759bSmrg
*4c3eb207Smrgtemplate<typename T, typename Shape, typename Derived>
cef8759bSmrgbool
*4c3eb207Smrgvector_builder<T, Shape, Derived>::repeating_sequence_p (unsigned int start,
cef8759bSmrg							 unsigned int end,
cef8759bSmrg							 unsigned int step)
cef8759bSmrg{
cef8759bSmrg  for (unsigned int i = start; i < end - step; ++i)
cef8759bSmrg    if (!derived ()->equal_p ((*this)[i], (*this)[i + step]))
cef8759bSmrg      return false;
cef8759bSmrg  return true;
cef8759bSmrg}
cef8759bSmrg
cef8759bSmrg/* Return true if elements [START, END) contain STEP interleaved linear
cef8759bSmrg   series.  */
cef8759bSmrg
*4c3eb207Smrgtemplate<typename T, typename Shape, typename Derived>
cef8759bSmrgbool
*4c3eb207Smrgvector_builder<T, Shape, Derived>::stepped_sequence_p (unsigned int start,
cef8759bSmrg						       unsigned int end,
cef8759bSmrg						       unsigned int step)
cef8759bSmrg{
cef8759bSmrg  if (!derived ()->allow_steps_p ())
cef8759bSmrg    return false;
cef8759bSmrg
cef8759bSmrg  for (unsigned int i = start + step * 2; i < end; ++i)
cef8759bSmrg    {
cef8759bSmrg      T elt1 = (*this)[i - step * 2];
cef8759bSmrg      T elt2 = (*this)[i - step];
cef8759bSmrg      T elt3 = (*this)[i];
cef8759bSmrg
cef8759bSmrg      if (!derived ()->integral_p (elt1)
cef8759bSmrg	  || !derived ()->integral_p (elt2)
cef8759bSmrg	  || !derived ()->integral_p (elt3))
cef8759bSmrg	return false;
cef8759bSmrg
cef8759bSmrg      if (maybe_ne (derived ()->step (elt1, elt2),
cef8759bSmrg		    derived ()->step (elt2, elt3)))
cef8759bSmrg	return false;
cef8759bSmrg
cef8759bSmrg      if (!derived ()->can_elide_p (elt3))
cef8759bSmrg	return false;
cef8759bSmrg    }
cef8759bSmrg  return true;
cef8759bSmrg}
cef8759bSmrg
cef8759bSmrg/* Try to change the number of encoded patterns to NPATTERNS, returning
cef8759bSmrg   true on success.  */
cef8759bSmrg
*4c3eb207Smrgtemplate<typename T, typename Shape, typename Derived>
cef8759bSmrgbool
*4c3eb207Smrgvector_builder<T, Shape, Derived>::try_npatterns (unsigned int npatterns)
cef8759bSmrg{
cef8759bSmrg  if (m_nelts_per_pattern == 1)
cef8759bSmrg    {
cef8759bSmrg      /* See whether NPATTERNS is valid with the current 1-element-per-pattern
cef8759bSmrg	 encoding.  */
cef8759bSmrg      if (repeating_sequence_p (0, encoded_nelts (), npatterns))
cef8759bSmrg	{
cef8759bSmrg	  reshape (npatterns, 1);
cef8759bSmrg	  return true;
cef8759bSmrg	}
cef8759bSmrg
cef8759bSmrg      /* We can only increase the number of elements per pattern if all
cef8759bSmrg	 elements are still encoded explicitly.  */
cef8759bSmrg      if (!encoded_full_vector_p ())
cef8759bSmrg	return false;
cef8759bSmrg    }
cef8759bSmrg
cef8759bSmrg  if (m_nelts_per_pattern <= 2)
cef8759bSmrg    {
cef8759bSmrg      /* See whether NPATTERNS is valid with a 2-element-per-pattern
cef8759bSmrg	 encoding.  */
cef8759bSmrg      if (repeating_sequence_p (npatterns, encoded_nelts (), npatterns))
cef8759bSmrg	{
cef8759bSmrg	  reshape (npatterns, 2);
cef8759bSmrg	  return true;
cef8759bSmrg	}
cef8759bSmrg
cef8759bSmrg      /* We can only increase the number of elements per pattern if all
cef8759bSmrg	 elements are still encoded explicitly.  */
cef8759bSmrg      if (!encoded_full_vector_p ())
cef8759bSmrg	return false;
cef8759bSmrg    }
cef8759bSmrg
cef8759bSmrg  if (m_nelts_per_pattern <= 3)
cef8759bSmrg    {
cef8759bSmrg      /* See whether we have NPATTERNS interleaved linear series,
cef8759bSmrg	 giving a 3-element-per-pattern encoding.  */
cef8759bSmrg      if (stepped_sequence_p (npatterns, encoded_nelts (), npatterns))
cef8759bSmrg	{
cef8759bSmrg	  reshape (npatterns, 3);
cef8759bSmrg	  return true;
cef8759bSmrg	}
cef8759bSmrg      return false;
cef8759bSmrg    }
cef8759bSmrg
cef8759bSmrg  gcc_unreachable ();
cef8759bSmrg}
cef8759bSmrg
cef8759bSmrg/* Replace the current encoding with the canonical form.  */
cef8759bSmrg
*4c3eb207Smrgtemplate<typename T, typename Shape, typename Derived>
cef8759bSmrgvoid
*4c3eb207Smrgvector_builder<T, Shape, Derived>::finalize ()
cef8759bSmrg{
cef8759bSmrg  /* The encoding requires the same number of elements to come from each
cef8759bSmrg     pattern.  */
cef8759bSmrg  gcc_assert (multiple_p (m_full_nelts, m_npatterns));
cef8759bSmrg
cef8759bSmrg  /* Allow the caller to build more elements than necessary.  For example,
cef8759bSmrg     it's often convenient to build a stepped vector from the natural
cef8759bSmrg     encoding of three elements even if the vector itself only has two.  */
cef8759bSmrg  unsigned HOST_WIDE_INT const_full_nelts;
cef8759bSmrg  if (m_full_nelts.is_constant (&const_full_nelts)
cef8759bSmrg      && const_full_nelts <= encoded_nelts ())
cef8759bSmrg    {
cef8759bSmrg      m_npatterns = const_full_nelts;
cef8759bSmrg      m_nelts_per_pattern = 1;
cef8759bSmrg    }
cef8759bSmrg
cef8759bSmrg  /* Try to whittle down the number of elements per pattern.  That is:
cef8759bSmrg
cef8759bSmrg     1. If we have stepped patterns whose steps are all 0, reduce the
cef8759bSmrg        number of elements per pattern from 3 to 2.
cef8759bSmrg
cef8759bSmrg     2. If we have background fill values that are the same as the
cef8759bSmrg        foreground values, reduce the number of elements per pattern
cef8759bSmrg        from 2 to 1.  */
cef8759bSmrg  while (m_nelts_per_pattern > 1
cef8759bSmrg	 && repeating_sequence_p (encoded_nelts () - m_npatterns * 2,
cef8759bSmrg				  encoded_nelts (), m_npatterns))
cef8759bSmrg    /* The last two sequences of M_NPATTERNS elements are equal,
cef8759bSmrg       so remove the last one.  */
cef8759bSmrg    reshape (m_npatterns, m_nelts_per_pattern - 1);
cef8759bSmrg
cef8759bSmrg  if (pow2p_hwi (m_npatterns))
cef8759bSmrg    {
cef8759bSmrg      /* Try to halve the number of patterns while doing so gives a
cef8759bSmrg	 valid pattern.  This approach is linear in the number of
cef8759bSmrg	 elements, whereas searcing from 1 up would be O(n*log(n)).
cef8759bSmrg
cef8759bSmrg	 Each halving step tries to keep the number of elements per pattern
cef8759bSmrg	 the same.  If that isn't possible, and if all elements are still
cef8759bSmrg	 explicitly encoded, the halving step can instead increase the number
cef8759bSmrg	 of elements per pattern.
cef8759bSmrg
cef8759bSmrg	 E.g. for:
cef8759bSmrg
cef8759bSmrg	     { 0, 2, 3, 4, 5, 6, 7, 8 }  npatterns == 8  full_nelts == 8
cef8759bSmrg
cef8759bSmrg	 we first realize that the second half of the sequence is not
cef8759bSmrg	 equal to the first, so we cannot maintain 1 element per pattern
cef8759bSmrg	 for npatterns == 4.  Instead we halve the number of patterns
cef8759bSmrg	 and double the number of elements per pattern, treating this
cef8759bSmrg	 as a "foreground" { 0, 2, 3, 4 } against a "background" of
cef8759bSmrg	 { 5, 6, 7, 8 | 5, 6, 7, 8 ... }:
cef8759bSmrg
cef8759bSmrg	     { 0, 2, 3, 4 | 5, 6, 7, 8 }  npatterns == 4
cef8759bSmrg
cef8759bSmrg	 Next we realize that this is *not* a foreround of { 0, 2 }
cef8759bSmrg	 against a background of { 3, 4 | 3, 4 ... }, so the only
cef8759bSmrg	 remaining option for reducing the number of patterns is
cef8759bSmrg	 to use a foreground of { 0, 2 } against a stepped background
cef8759bSmrg	 of { 1, 2 | 3, 4 | 5, 6 ... }.  This is valid because we still
cef8759bSmrg	 haven't elided any elements:
cef8759bSmrg
cef8759bSmrg	     { 0, 2 | 3, 4 | 5, 6 }  npatterns == 2
cef8759bSmrg
cef8759bSmrg	 This in turn can be reduced to a foreground of { 0 } against a
cef8759bSmrg	 stepped background of { 1 | 2 | 3 ... }:
cef8759bSmrg
cef8759bSmrg	     { 0 | 2 | 3 }  npatterns == 1
cef8759bSmrg
cef8759bSmrg	 This last step would not have been possible for:
cef8759bSmrg
cef8759bSmrg	     { 0, 0 | 3, 4 | 5, 6 }  npatterns == 2.  */
cef8759bSmrg      while ((m_npatterns & 1) == 0 && try_npatterns (m_npatterns / 2))
cef8759bSmrg	continue;
cef8759bSmrg
cef8759bSmrg      /* Builders of arbitrary fixed-length vectors can use:
cef8759bSmrg
cef8759bSmrg	     new_vector (x, x, 1)
cef8759bSmrg
cef8759bSmrg	 so that every element is specified explicitly.  Handle cases
cef8759bSmrg	 that are actually wrapping series, like { 0, 1, 2, 3, 0, 1, 2, 3 }
cef8759bSmrg	 would be for 2-bit elements.  We'll have treated them as
cef8759bSmrg	 duplicates in the loop above.  */
cef8759bSmrg      if (m_nelts_per_pattern == 1
cef8759bSmrg	  && m_full_nelts.is_constant (&const_full_nelts)
cef8759bSmrg	  && this->length () >= const_full_nelts
cef8759bSmrg	  && (m_npatterns & 3) == 0
cef8759bSmrg	  && stepped_sequence_p (m_npatterns / 4, const_full_nelts,
cef8759bSmrg				 m_npatterns / 4))
cef8759bSmrg	{
cef8759bSmrg	  reshape (m_npatterns / 4, 3);
cef8759bSmrg	  while ((m_npatterns & 1) == 0 && try_npatterns (m_npatterns / 2))
cef8759bSmrg	    continue;
cef8759bSmrg	}
cef8759bSmrg    }
cef8759bSmrg  else
cef8759bSmrg    /* For the non-power-of-2 case, do a simple search up from 1.  */
cef8759bSmrg    for (unsigned int i = 1; i <= m_npatterns / 2; ++i)
cef8759bSmrg      if (m_npatterns % i == 0 && try_npatterns (i))
cef8759bSmrg	break;
cef8759bSmrg}
cef8759bSmrg
cef8759bSmrg#endif