doxygen/ScopBuilder_8cpp_source.html

//===- ScopBuilder.cpp ----------------------------------------------------===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

//

// Create a polyhedral description for a static control flow region.

//

// The pass creates a polyhedral description of the Scops detected by the SCoP

// detection derived from their LLVM-IR code.

//

//===----------------------------------------------------------------------===//


#include "polly/ScopBuilder.h"

#include "polly/Options.h"

#include "polly/ScopDetection.h"

#include "polly/ScopInfo.h"

#include "polly/Support/GICHelper.h"

#include "polly/Support/ISLTools.h"

#include "polly/Support/SCEVValidator.h"

#include "polly/Support/ScopHelper.h"

#include "polly/Support/VirtualInstruction.h"

#include "llvm/ADT/ArrayRef.h"

#include "llvm/ADT/EquivalenceClasses.h"

#include "llvm/ADT/PostOrderIterator.h"

#include "llvm/ADT/Sequence.h"

#include "llvm/ADT/SmallSet.h"

#include "llvm/ADT/Statistic.h"

#include "llvm/Analysis/AliasAnalysis.h"

#include "llvm/Analysis/AssumptionCache.h"

#include "llvm/Analysis/Delinearization.h"

#include "llvm/Analysis/Loads.h"

#include "llvm/Analysis/LoopInfo.h"

#include "llvm/Analysis/OptimizationRemarkEmitter.h"

#include "llvm/Analysis/RegionInfo.h"

#include "llvm/Analysis/RegionIterator.h"

#include "llvm/Analysis/ScalarEvolution.h"

#include "llvm/Analysis/ScalarEvolutionExpressions.h"

#include "llvm/IR/BasicBlock.h"

#include "llvm/IR/DataLayout.h"

#include "llvm/IR/DebugLoc.h"

#include "llvm/IR/DerivedTypes.h"

#include "llvm/IR/Dominators.h"

#include "llvm/IR/Function.h"

#include "llvm/IR/InstrTypes.h"

#include "llvm/IR/Instruction.h"

#include "llvm/IR/Instructions.h"

#include "llvm/IR/Type.h"

#include "llvm/IR/Use.h"

#include "llvm/IR/Value.h"

#include "llvm/Support/CommandLine.h"

#include "llvm/Support/Compiler.h"

#include "llvm/Support/Debug.h"

#include "llvm/Support/ErrorHandling.h"

#include "llvm/Support/raw_ostream.h"

#include <cassert>


using namespace llvm;

using namespace polly;


#include "polly/Support/PollyDebug.h"

#define DEBUG_TYPE "polly-scops"


// Counters declared through LLVM's STATISTIC macro; each pairs a counter name
// with the human-readable description given as the second argument.
STATISTIC(ScopFound, "Number of valid Scops");
STATISTIC(RichScopFound, "Number of Scops containing a loop");
STATISTIC(InfeasibleScops,
          "Number of SCoPs with statically infeasible context.");

// Definition of the polly-namespace flag variable. It is bound to the
// "polly-analyze-read-only-scalars" option below via cl::location, so the
// command-line parser writes the option's value directly into this variable.
bool polly::ModelReadOnlyScalars;

// The maximal number of dimensions we allow during invariant load construction.
// More complex access ranges will result in very high compile time and are also
// unlikely to result in good code. This value is very high and should only
// trigger for corner cases (e.g., the "dct_luma" function in h264, SPEC2006).
static unsigned const MaxDimensionsInAccessRange = 9;

// Hidden boolean option (initial value: true) whose storage is the external
// variable polly::ModelReadOnlyScalars defined above.
static cl::opt<bool, true> XModelReadOnlyScalars(
    "polly-analyze-read-only-scalars",
    cl::desc("Model read-only scalar values in the scop description"),
    cl::location(ModelReadOnlyScalars), cl::Hidden, cl::init(true),
    cl::cat(PollyCategory));

// Hidden integer option (initial value: 800000). Per its description, a value
// of 0 disables the bound on computational steps.
static cl::opt<int>
    OptComputeOut("polly-analysis-computeout",
                  cl::desc("Bound the scop analysis by a maximal amount of "
                           "computational steps (0 means no bound)"),
                  cl::Hidden, cl::init(800000), cl::cat(PollyCategory));


// Hidden boolean option (initial value: false). When enabled, pointer
// parameters of functions are treated as dereferenceable, which the
// description states is only valid if those pointers are always initialized.
// The help text is assembled from adjacent string literals; keep the leading
// space on each continuation literal so the words do not run together.
static cl::opt<bool> PollyAllowDereferenceOfAllFunctionParams(
    "polly-allow-dereference-of-all-function-parameters",
    cl::desc(
        "Treat all parameters to functions that are pointers as dereferenceable."
        " This is useful for invariant load hoisting, since we can generate"
        " fewer runtime checks. This is only valid if all pointers to functions"
        " are always initialized, so that Polly can choose to hoist"
        " their loads. "),
    cl::Hidden, cl::init(false), cl::cat(PollyCategory));


// Hidden boolean option (initial value: false); per its description, enabling
// it suppresses all inbounds assumptions.
static cl::opt<bool>
    PollyIgnoreInbounds("polly-ignore-inbounds",
                        cl::desc("Do not take inbounds assumptions at all"),
                        cl::Hidden, cl::init(false), cl::cat(PollyCategory));

// Hidden unsigned option (initial value: 20) limiting how many arrays are
// compared within a single alias group when building run-time checks.
static cl::opt<unsigned> RunTimeChecksMaxArraysPerGroup(
    "polly-rtc-max-arrays-per-group",
    cl::desc("The maximal number of arrays to compare in each alias group."),
    cl::Hidden, cl::init(20), cl::cat(PollyCategory));


// Hidden unsigned option (initial value: 8) limiting the number of disjuncts
// a memory access may have for it to be used when building run-time checks
// (RTCs). The description is split over two adjacent literals; the first one
// carries the trailing space that separates them.
static cl::opt<unsigned> RunTimeChecksMaxAccessDisjuncts(
    "polly-rtc-max-array-disjuncts",
    cl::desc("The maximal number of disjuncts allowed in memory accesses "
             "to build RTCs."),
    cl::Hidden, cl::init(8), cl::cat(PollyCategory));


// Hidden unsigned option (initial value: 8) limiting the number of parameters
// allowed in run-time checks (RTCs).
static cl::opt<unsigned> RunTimeChecksMaxParameters(
    "polly-rtc-max-parameters",
    cl::desc("The maximal number of parameters allowed in RTCs."), cl::Hidden,
    cl::init(8), cl::cat(PollyCategory));

// Hidden boolean option (initial value: false); when set, statements with
// scalar accesses are counted as not optimizable.
static cl::opt<bool> UnprofitableScalarAccs(
    "polly-unprofitable-scalar-accs",
    cl::desc("Count statements with scalar accesses as not optimizable"),
    cl::Hidden, cl::init(false), cl::cat(PollyCategory));

// String option (initial value: empty) taking an isl parameter set with
// additional constraints on the context parameters. Unlike most options in
// this file it is not marked cl::Hidden.
static cl::opt<std::string> UserContextStr(
    "polly-context", cl::value_desc("isl parameter set"),
    cl::desc("Provide additional constraints on the context parameters"),
    cl::init(""), cl::cat(PollyCategory));

// Hidden boolean option (initial value: true) controlling reduction
// detection.
static cl::opt<bool> DetectReductions("polly-detect-reductions",
                                      cl::desc("Detect and exploit reductions"),
                                      cl::Hidden, cl::init(true),
                                      cl::cat(PollyCategory));

// Multiplicative reductions can be disabled separately as these kinds of
// operations can overflow easily. Additive reductions and bit operations
// are in contrast pretty stable.
// Note: no cl::init is given for this option.
static cl::opt<bool> DisableMultiplicativeReductions(
    "polly-disable-multiplicative-reductions",
    cl::desc("Disable multiplicative reductions"), cl::Hidden,
    cl::cat(PollyCategory));

// Strategies selectable through "polly-stmt-granularity" for splitting basic
// blocks into statements; the meaning of each value is given by the
// corresponding clEnumValN description below.
enum class GranularityChoice { BasicBlocks, ScalarIndependence, Stores };

// Enum option mapping the spellings "bb", "scalar-indep" and "store" to the
// GranularityChoice values; the initial value is ScalarIndependence.
static cl::opt<GranularityChoice> StmtGranularity(
    "polly-stmt-granularity",
    cl::desc(
        "Algorithm to use for splitting basic blocks into multiple statements"),
    cl::values(clEnumValN(GranularityChoice::BasicBlocks, "bb",
                          "One statement per basic block"),
               clEnumValN(GranularityChoice::ScalarIndependence, "scalar-indep",
                          "Scalar independence heuristic"),
               clEnumValN(GranularityChoice::Stores, "store",
                          "Store-level granularity")),
    cl::init(GranularityChoice::ScalarIndependence), cl::cat(PollyCategory));


/// Helper to treat non-affine regions and basic blocks the same.

///

///{


/// Map the region node @p RN to the single basic block that represents it.
///
/// A node wrapping a subregion is represented by that subregion's entry
/// block; a node wrapping a plain basic block is represented by the block
/// itself.
static inline BasicBlock *getRegionNodeBasicBlock(RegionNode *RN) {
  if (!RN->isSubRegion())
    return RN->getNodeAs<BasicBlock>();

  Region *SubRegion = RN->getNodeAs<Region>();
  return SubRegion->getEntry();
}


/// Return the block reached through successor number @p idx of @p RN.
///
/// For a plain basic-block node this is successor @p idx of the terminator
/// @p TI. A subregion node has exactly one way out, its exit block, so
/// @p idx must be 0 in that case and @p TI is not consulted.
static inline BasicBlock *
getRegionNodeSuccessor(RegionNode *RN, Instruction *TI, unsigned idx) {
  if (!RN->isSubRegion())
    return TI->getSuccessor(idx);

  assert(idx == 0);
  Region *SubRegion = RN->getNodeAs<Region>();
  return SubRegion->getExit();
}


/// Check whether the region node @p RN covers at least one error block.
///
/// @param RN The node to inspect (a basic block or a subregion).
/// @param R  The region passed on to ScopDetection::isErrorBlock.
/// @param SD The ScopDetection instance answering the error-block query.
///
/// @returns True if the block wrapped by @p RN is an error block, or, for a
///          subregion node, if any block of that subregion is one.
static bool containsErrorBlock(RegionNode *RN, const Region &R,
                               ScopDetection *SD) {
  if (RN->isSubRegion()) {
    Region *SubRegion = RN->getNodeAs<Region>();
    return llvm::any_of(SubRegion->blocks(), [&R, SD](BasicBlock *Block) {
      return SD->isErrorBlock(*Block, R);
    });
  }

  BasicBlock *Block = RN->getNodeAs<BasicBlock>();
  return SD->isErrorBlock(*Block, R);
}


///}


/// Build the relation that advances one loop counter by a single step.
///
/// The result maps SetSpace -> SetSpace. Dimension @p Dim of the output is
/// the corresponding input dimension plus one; every other dimension is
/// carried over unchanged. For @p Dim == 2 and a 4-dimensional @p SetSpace:
///
///             [i0, i1, i2, i3] -> [i0, i1, i2 + 1, i3]
static isl::map createNextIterationMap(isl::space SetSpace, unsigned Dim) {
  isl::space RelationSpace = SetSpace.map_from_set();
  isl::map Next = isl::map::universe(RelationSpace);

  // Tie input and output together on every dimension but the advanced one.
  for (unsigned Pos : rangeIslSize(0, Next.domain_tuple_dim())) {
    if (Pos == Dim)
      continue;
    Next = Next.equate(isl::dim::in, Pos, isl::dim::out, Pos);
  }

  // Equality  in[Dim] - out[Dim] + 1 == 0,  i.e.  out[Dim] == in[Dim] + 1.
  isl::constraint Step =
      isl::constraint::alloc_equality(isl::local_space(RelationSpace))
          .set_constant_si(1)
          .set_coefficient_si(isl::dim::in, Dim, 1)
          .set_coefficient_si(isl::dim::out, Dim, -1);

  return Next.add_constraint(Step);
}


/// Return the union of all bounded basic sets that make up @p S.
///
/// The result lives in the space of @p S and starts out empty; every basic
/// set of @p S for which is_bounded() holds is added to it.
static isl::set collectBoundedParts(isl::set S) {
  isl::set Bounded = isl::set::empty(S.get_space());

  isl::basic_set_list Pieces = S.get_basic_set_list();
  for (isl::basic_set Piece : Pieces) {
    if (Piece.is_bounded()) {
      Bounded = Bounded.unite(isl::set(Piece));
    }
  }

  return Bounded;
}


/// Split @p S into the parts that are unbounded and bounded in dimension
/// @p Dim.
///
/// All set dimensions of @p S are first restricted to be non-negative. The
/// boundedness test is then done on a copy in which the dimensions after
/// @p Dim are projected out and each dimension before @p Dim is capped by a
/// fresh parameter, so that only @p Dim itself decides the outcome.
///
/// @returns A pair (unbounded part, bounded part), both subsets of the
///          non-negative version of @p S.
static std::pair<isl::set, isl::set> partitionSetParts(isl::set S,
                                                       unsigned Dim) {
  for (unsigned Pos : rangeIslSize(0, S.tuple_dim()))
    S = S.lower_bound_si(isl::dim::set, Pos, 0);

  const unsigned TotalDims = unsignedFromIslSize(S.tuple_dim());
  assert(TotalDims >= Dim + 1);
  const unsigned TrailingDims = TotalDims - Dim - 1;

  // Dimensions behind Dim are irrelevant for the question asked here.
  isl::set Prefix = S.project_out(isl::dim::set, Dim + 1, TrailingDims);

  // Dimensions in front of Dim get an artificial parametric upper bound
  // (param_k - set_k >= 0) so they cannot make the set look unbounded.
  Prefix = Prefix.insert_dims(isl::dim::param, 0, Dim);
  for (unsigned Pos = 0; Pos != Dim; ++Pos) {
    isl::constraint Cap =
        isl::constraint::alloc_inequality(isl::local_space(Prefix.get_space()))
            .set_coefficient_si(isl::dim::param, Pos, 1)
            .set_coefficient_si(isl::dim::set, Pos, -1);
    Prefix = Prefix.add_constraint(Cap);
  }

  isl::set Bounded = collectBoundedParts(Prefix);

  // Undo the two transformations: re-create the trailing dimensions and
  // drop the helper parameters again.
  Bounded = Bounded.insert_dims(isl::dim::set, Dim + 1, TrailingDims);
  Bounded = Bounded.remove_dims(isl::dim::param, 0, Dim);

  isl::set Unbounded = S.subtract(Bounded);
  return {Unbounded, Bounded};
}


/// Build the set of points at which the comparison @p L @p Pred @p R holds.
///
/// Signed and unsigned flavours of the same ordering are translated to the
/// same isl comparison; no wrap-around handling happens in this helper.
/// Any predicate that is not an integer comparison is unreachable here.
static isl::set buildConditionSet(ICmpInst::Predicate Pred, isl::pw_aff L,
                                  isl::pw_aff R) {
  switch (Pred) {
  case ICmpInst::ICMP_EQ:
    return L.eq_set(R);
  case ICmpInst::ICMP_NE:
    return L.ne_set(R);

  case ICmpInst::ICMP_SLT:
  case ICmpInst::ICMP_ULT:
    return L.lt_set(R);

  case ICmpInst::ICMP_SLE:
  case ICmpInst::ICMP_ULE:
    return L.le_set(R);

  case ICmpInst::ICMP_SGT:
  case ICmpInst::ICMP_UGT:
    return L.gt_set(R);

  case ICmpInst::ICMP_SGE:
  case ICmpInst::ICMP_UGE:
    return L.ge_set(R);

  default:
    llvm_unreachable("Non integer predicate not supported");
  }
}


/// Reshape @p Dom, a domain valid inside loop @p OldL, so that it has the
/// dimensionality expected inside loop @p NewL.
///
/// Depths are taken relative to the scop; a relative depth of -1 is treated
/// as "not an affine loop of this scop".
isl::set ScopBuilder::adjustDomainDimensions(isl::set Dom, Loop *OldL,
                                             Loop *NewL) {
  // Same loop: the domain already has the right shape.
  if (OldL == NewL)
    return Dom;

  const int OldDepth = scop->getRelativeLoopDepth(OldL);
  const int NewDepth = scop->getRelativeLoopDepth(NewL);

  // Neither loop contributes a dimension, so there is nothing to adjust.
  if (OldDepth == -1 && NewDepth == -1)
    return Dom;

  // Depth decreased: one or more loops were left. Drop as many innermost
  // dimensions as the depth difference.
  if (OldDepth > NewDepth) {
    unsigned Diff = OldDepth - NewDepth;
    unsigned NumDim = unsignedFromIslSize(Dom.tuple_dim());
    assert(NumDim >= Diff);
    return Dom.project_out(isl::dim::set, NumDim - Diff, Diff);
  }

  // Depth increased: exactly one loop was entered and none was left, so a
  // single fresh dimension is appended.
  if (OldDepth < NewDepth) {
    assert(OldDepth + 1 == NewDepth);
    auto &R = scop->getRegion();
    (void)R;
    assert(NewL->getParentLoop() == OldL ||
           ((!OldL || !R.contains(OldL)) && R.contains(NewL)));
    return Dom.add_dims(isl::dim::set, 1);
  }

  // Same depth but different loops: a sibling loop was left and another one
  // entered. Replace the innermost dimension by an unconstrained one.
  assert(OldL->getParentLoop() == NewL->getParentLoop());
  Dom = Dom.project_out(isl::dim::set, NewDepth, 1);
  return Dom.add_dims(isl::dim::set, 1);
}


/// Translate the SCEV @p E into a piecewise affine function valid in @p BB.
///
/// @param BB               The block in whose context @p E is translated.
/// @param InvalidDomainMap Per-block invalid domains; the entry for @p BB is
///                         extended by the invalid part reported for @p E.
/// @param E                The SCEV to translate.
/// @param NonNegative      Forwarded to Scop::getPwAff; indicates that @p E
///                         has to be non-negative.
///
/// @returns The translated function as a raw isl object owned by the caller.
__isl_give isl_pw_aff *
ScopBuilder::getPwAff(BasicBlock *BB,
                      DenseMap<BasicBlock *, isl::set> &InvalidDomainMap,
                      const SCEV *E, bool NonNegative) {
  PWACtx Translated = scop->getPwAff(E, BB, NonNegative, &RecordedAssumptions);

  // Accumulate the part of the domain on which the translation is not valid.
  isl::set &InvalidDomain = InvalidDomainMap[BB];
  InvalidDomain = InvalidDomain.unite(Translated.second);

  return Translated.first.release();
}


/// Build the condition set for an unsigned comparison of the form
/// TestVal < UpperBound or TestVal <= UpperBound.
///
/// Unsigned operands need special care: if the most significant bit (the
/// sign bit) of an operand is set, the value wraps around when read as a
/// signed number. The produced set is therefore the conjunction
///
///     0 <= TestVal   and   TestVal (< | <=) UpperBound
///
/// where a non-negativity assumption is requested for UpperBound but not
/// for TestVal.
///
/// @param IsStrictUpperBound Selects the relation between TestVal and
///                           UpperBound: true for '<', false for '<='.
///
/// @p Condition and @p Domain are not referenced in the body.
__isl_give isl_set *ScopBuilder::buildUnsignedConditionSets(
    BasicBlock *BB, Value *Condition, __isl_keep isl_set *Domain,
    const SCEV *SCEV_TestVal, const SCEV *SCEV_UpperBound,
    DenseMap<BasicBlock *, isl::set> &InvalidDomainMap,
    bool IsStrictUpperBound) {
  // TestVal may have its sign bit set, so no non-negativity is assumed.
  isl_pw_aff *TestVal = getPwAff(BB, InvalidDomainMap, SCEV_TestVal, false);
  // UpperBound, in contrast, is assumed to be non-negative.
  isl_pw_aff *UpperBound =
      getPwAff(BB, InvalidDomainMap, SCEV_UpperBound, true);

  // Lower part of the range check: 0 <= TestVal.
  isl_local_space *TestValSpace =
      isl_local_space_from_space(isl_pw_aff_get_domain_space(TestVal));
  isl_pw_aff *Zero = isl_pw_aff_zero_on_domain(TestValSpace);
  isl_set *AtLeastZero = isl_pw_aff_le_set(Zero, isl_pw_aff_copy(TestVal));

  // Upper part of the range check; this consumes TestVal and UpperBound.
  isl_set *BelowBound = IsStrictUpperBound
                            ? isl_pw_aff_lt_set(TestVal, UpperBound)
                            : isl_pw_aff_le_set(TestVal, UpperBound);

  return isl_set_intersect(AtLeastZero, BelowBound);
}


/// Build one condition set per successor of the switch @p SI.
///
/// On return @p ConditionSets has SI->getNumSuccessors() entries, indexed by
/// successor. Entry i (i > 0) is the part of @p Domain on which the switch
/// condition equals the corresponding case value; entry 0 (the default
/// destination) is @p Domain minus the union of all case sets.
///
/// @param BB               Block in whose context the SCEVs are translated.
/// @param SI               The switch terminator.
/// @param L                Loop scope used to evaluate the switch condition.
/// @param Domain           Domain of @p BB; not consumed.
/// @param InvalidDomainMap Updated by the SCEV translations.
/// @param ConditionSets    Output; the caller owns the raw isl sets.
///
/// @returns Always true.
bool ScopBuilder::buildConditionSets(
    BasicBlock *BB, SwitchInst *SI, Loop *L, __isl_keep isl_set *Domain,
    DenseMap<BasicBlock *, isl::set> &InvalidDomainMap,
    SmallVectorImpl<__isl_give isl_set *> &ConditionSets) {
  Value *Condition = getConditionFromTerminator(SI);
  assert(Condition && "No condition for switch");

  // Hold the switch operand in an RAII wrapper so it is released on every
  // path out of this function.
  isl::pw_aff LHS = isl::manage(
      getPwAff(BB, InvalidDomainMap, SE.getSCEVAtScope(Condition, L)));

  unsigned NumSuccessors = SI->getNumSuccessors();
  ConditionSets.resize(NumSuccessors);
  for (auto &Case : SI->cases()) {
    unsigned Idx = Case.getSuccessorIndex();
    ConstantInt *CaseValue = Case.getCaseValue();

    isl::pw_aff RHS =
        isl::manage(getPwAff(BB, InvalidDomainMap, SE.getSCEV(CaseValue)));
    isl_set *CaseConditionSet =
        buildConditionSet(ICmpInst::ICMP_EQ, LHS, RHS).release();
    ConditionSets[Idx] = isl_set_coalesce(
        isl_set_intersect(CaseConditionSet, isl_set_copy(Domain)));
  }

  assert(ConditionSets[0] == nullptr && "Default condition set was set");

  // Union of all explicit cases. A switch that only has a default
  // destination has a single successor; in that case there is no entry 1 to
  // start from, so begin with the empty set instead of indexing past the end.
  isl_set *ConditionSetUnion = NumSuccessors > 1
                                   ? isl_set_copy(ConditionSets[1])
                                   : isl_set_empty(isl_set_get_space(Domain));
  for (unsigned u = 2; u < NumSuccessors; u++)
    ConditionSetUnion =
        isl_set_union(ConditionSetUnion, isl_set_copy(ConditionSets[u]));

  // The default destination is taken whenever no case matches.
  ConditionSets[0] = isl_set_subtract(isl_set_copy(Domain), ConditionSetUnion);

  return true;
}


/// Build the condition sets for a two-way decision on @p Condition.
///
/// On success exactly two sets are appended to @p ConditionSets: first the
/// part of @p Domain on which @p Condition holds (the "consequence" set),
/// then @p Domain minus that part (the "alternative" set). The caller owns
/// the appended raw isl sets.
///
/// @param BB               Block in whose context SCEVs are translated.
/// @param Condition        The condition value; handled kinds are loads,
///                         PHI nodes, constant integers, and/or binary
///                         operators and integer comparisons.
/// @param TI               The terminator using @p Condition, or nullptr if
///                         only parameter constraints are wanted.
/// @param L                Loop scope used when evaluating SCEVs.
/// @param Domain           Domain of @p BB; not consumed.
/// @param InvalidDomainMap Updated by the SCEV translations.
/// @param ConditionSets    Output vector (see above).
///
/// @returns False if a resulting set reaches MaxDisjunctsInDomain basic sets
///          (the scop is invalidated with COMPLEXITY in that case) or if a
///          recursive call for an and/or operand failed; true otherwise.
bool ScopBuilder::buildConditionSets(
    BasicBlock *BB, Value *Condition, Instruction *TI, Loop *L,
    __isl_keep isl_set *Domain,
    DenseMap<BasicBlock *, isl::set> &InvalidDomainMap,
    SmallVectorImpl<__isl_give isl_set *> &ConditionSets) {
  isl_set *ConsequenceCondSet = nullptr;

  if (auto Load = dyn_cast<LoadInst>(Condition)) {
    // A load used directly as condition: the set is built by comparing the
    // loaded value against zero with the ICMP_SLE predicate.
    const SCEV *LHSSCEV = SE.getSCEVAtScope(Load, L);
    const SCEV *RHSSCEV = SE.getZero(LHSSCEV->getType());
    bool NonNeg = false;
    isl_pw_aff *LHS = getPwAff(BB, InvalidDomainMap, LHSSCEV, NonNeg);
    isl_pw_aff *RHS = getPwAff(BB, InvalidDomainMap, RHSSCEV, NonNeg);
    ConsequenceCondSet = buildConditionSet(ICmpInst::ICMP_SLE, isl::manage(LHS),
                                           isl::manage(RHS))
                             .release();
  } else if (auto *PHI = dyn_cast<PHINode>(Condition)) {
    // A PHI condition is reduced to its unique non-error incoming value,
    // which is expected to be a constant integer.
    auto *Unique = dyn_cast<ConstantInt>(
        getUniqueNonErrorValue(PHI, &scop->getRegion(), &SD));
    assert(Unique &&
           "A PHINode condition should only be accepted by ScopDetection if "
           "getUniqueNonErrorValue returns non-NULL");

    if (Unique->isZero())
      ConsequenceCondSet = isl_set_empty(isl_set_get_space(Domain));
    else
      ConsequenceCondSet = isl_set_universe(isl_set_get_space(Domain));
  } else if (auto *CCond = dyn_cast<ConstantInt>(Condition)) {
    // Constant condition: never taken (empty) or always taken (universe).
    if (CCond->isZero())
      ConsequenceCondSet = isl_set_empty(isl_set_get_space(Domain));
    else
      ConsequenceCondSet = isl_set_universe(isl_set_get_space(Domain));
  } else if (BinaryOperator *BinOp = dyn_cast<BinaryOperator>(Condition)) {
    auto Opcode = BinOp->getOpcode();
    assert(Opcode == Instruction::And || Opcode == Instruction::Or);

    // Recurse into both operands. Each successful call appends a
    // (consequence, alternative) pair; the second call is skipped if the
    // first one fails.
    bool Valid = buildConditionSets(BB, BinOp->getOperand(0), TI, L, Domain,
                                    InvalidDomainMap, ConditionSets) &&
                 buildConditionSets(BB, BinOp->getOperand(1), TI, L, Domain,
                                    InvalidDomainMap, ConditionSets);
    if (!Valid) {
      // Release everything collected so far before reporting failure.
      while (!ConditionSets.empty())
        isl_set_free(ConditionSets.pop_back_val());
      return false;
    }

    // Pop the two pairs in reverse push order. The alternative sets are
    // discarded; only the consequence sets are combined. Note that
    // ConsCondPart0 therefore belongs to operand 1 and ConsCondPart1 to
    // operand 0.
    isl_set_free(ConditionSets.pop_back_val());
    isl_set *ConsCondPart0 = ConditionSets.pop_back_val();
    isl_set_free(ConditionSets.pop_back_val());
    isl_set *ConsCondPart1 = ConditionSets.pop_back_val();

    if (Opcode == Instruction::And)
      ConsequenceCondSet = isl_set_intersect(ConsCondPart0, ConsCondPart1);
    else
      ConsequenceCondSet = isl_set_union(ConsCondPart0, ConsCondPart1);
  } else {
    auto *ICond = dyn_cast<ICmpInst>(Condition);
    assert(ICond &&
           "Condition of exiting branch was neither constant nor ICmp!");

    Region &R = scop->getRegion();

    isl_pw_aff *LHS, *RHS;
    // For unsigned comparisons we assumed the signed bit of neither operand
    // to be set. The comparison is equal to a signed comparison under this
    // assumption.
    bool NonNeg = ICond->isUnsigned();
    const SCEV *LeftOperand = SE.getSCEVAtScope(ICond->getOperand(0), L),
               *RightOperand = SE.getSCEVAtScope(ICond->getOperand(1), L);

    LeftOperand = tryForwardThroughPHI(LeftOperand, R, SE, &SD);
    RightOperand = tryForwardThroughPHI(RightOperand, R, SE, &SD);

    // The four unsigned orderings go through buildUnsignedConditionSets,
    // which expects (TestVal, UpperBound); for the "greater" predicates the
    // operands are swapped so the same helper can be used.
    switch (ICond->getPredicate()) {
    case ICmpInst::ICMP_ULT:
      ConsequenceCondSet =
          buildUnsignedConditionSets(BB, Condition, Domain, LeftOperand,
                                     RightOperand, InvalidDomainMap, true);
      break;
    case ICmpInst::ICMP_ULE:
      ConsequenceCondSet =
          buildUnsignedConditionSets(BB, Condition, Domain, LeftOperand,
                                     RightOperand, InvalidDomainMap, false);
      break;
    case ICmpInst::ICMP_UGT:
      ConsequenceCondSet =
          buildUnsignedConditionSets(BB, Condition, Domain, RightOperand,
                                     LeftOperand, InvalidDomainMap, true);
      break;
    case ICmpInst::ICMP_UGE:
      ConsequenceCondSet =
          buildUnsignedConditionSets(BB, Condition, Domain, RightOperand,
                                     LeftOperand, InvalidDomainMap, false);
      break;
    default:
      // All remaining predicates are translated directly.
      LHS = getPwAff(BB, InvalidDomainMap, LeftOperand, NonNeg);
      RHS = getPwAff(BB, InvalidDomainMap, RightOperand, NonNeg);
      ConsequenceCondSet = buildConditionSet(ICond->getPredicate(),
                                             isl::manage(LHS), isl::manage(RHS))
                               .release();
      break;
    }
  }

  // If no terminator was given we are only looking for parameter constraints
  // under which @p Condition is true/false.
  if (!TI)
    ConsequenceCondSet = isl_set_params(ConsequenceCondSet);
  assert(ConsequenceCondSet);
  // Restrict the condition to the block's domain.
  ConsequenceCondSet = isl_set_coalesce(
      isl_set_intersect(ConsequenceCondSet, isl_set_copy(Domain)));

  // Give up if either the consequence set or its complement within Domain
  // consists of MaxDisjunctsInDomain or more basic sets. The complement is
  // only computed when the consequence set itself is small enough.
  isl_set *AlternativeCondSet = nullptr;
  bool TooComplex =
      isl_set_n_basic_set(ConsequenceCondSet) >= (int)MaxDisjunctsInDomain;

  if (!TooComplex) {
    AlternativeCondSet = isl_set_subtract(isl_set_copy(Domain),
                                          isl_set_copy(ConsequenceCondSet));
    TooComplex =
        isl_set_n_basic_set(AlternativeCondSet) >= (int)MaxDisjunctsInDomain;
  }

  if (TooComplex) {
    scop->invalidate(COMPLEXITY, TI ? TI->getDebugLoc() : DebugLoc(),
                     TI ? TI->getParent() : nullptr /* BasicBlock */);
    // AlternativeCondSet may still be nullptr here.
    isl_set_free(AlternativeCondSet);
    isl_set_free(ConsequenceCondSet);
    return false;
  }

  // Hand both sets to the caller: consequence first, alternative second.
  ConditionSets.push_back(ConsequenceCondSet);
  ConditionSets.push_back(isl_set_coalesce(AlternativeCondSet));

  return true;
}


/// Build the condition sets for all successors of the terminator @p TI.
///
/// Switch instructions are delegated to the switch overload. For a branch
/// with a single successor, a copy of @p Domain is the only condition set.
/// Any other branch is handled through its condition value.
///
/// @returns The result of the overload the work was delegated to, or true
///          for a single-successor branch.
bool ScopBuilder::buildConditionSets(
    BasicBlock *BB, Instruction *TI, Loop *L, __isl_keep isl_set *Domain,
    DenseMap<BasicBlock *, isl::set> &InvalidDomainMap,
    SmallVectorImpl<__isl_give isl_set *> &ConditionSets) {
  if (auto *Switch = dyn_cast<SwitchInst>(TI)) {
    return buildConditionSets(BB, Switch, L, Domain, InvalidDomainMap,
                              ConditionSets);
  }

  assert(isa<BranchInst>(TI) && "Terminator was neither branch nor switch.");

  if (TI->getNumSuccessors() != 1) {
    Value *Condition = getConditionFromTerminator(TI);
    assert(Condition && "No condition for Terminator");

    return buildConditionSets(BB, Condition, TI, L, Domain, InvalidDomainMap,
                              ConditionSets);
  }

  // Single successor: it is reached whenever the block itself is executed.
  ConditionSets.push_back(isl_set_copy(Domain));
  return true;
}


/// Refine the domains of all nodes in @p R with the domains of their
/// predecessors.
///
/// Unlike buildDomainsWithBranchConstraints, which pushes domain information
/// to successors, this function pulls it from predecessors. The domains are
/// expected to exist already. Nodes are visited in reverse post order, so
/// every predecessor has been handled before a block or non-affine subregion
/// is visited. For headers of loops contained in the scop, the loop bounds
/// are added afterwards.
///
/// @returns False as soon as a recursive call or addLoopBoundsToHeaderDomain
///          fails; true otherwise.
bool ScopBuilder::propagateDomainConstraints(
    Region *R, DenseMap<BasicBlock *, isl::set> &InvalidDomainMap) {
  ReversePostOrderTraversal<Region *> Order(R);
  for (auto *Node : Order) {
    // Affine subregions are descended into; basic blocks and non-affine
    // subregions are treated as a single unit below.
    const bool IsAffineSubRegion =
        Node->isSubRegion() &&
        !scop->isNonAffineSubRegion(Node->getNodeAs<Region>());
    if (IsAffineSubRegion) {
      if (!propagateDomainConstraints(Node->getNodeAs<Region>(),
                                      InvalidDomainMap))
        return false;
      continue;
    }

    BasicBlock *BB = getRegionNodeBasicBlock(Node);
    isl::set &Domain = scop->getOrInitEmptyDomain(BB);
    assert(!Domain.is_null());

    // The block can only be reached under the union of the conditions of
    // its predecessors.
    isl::set FromPredecessors = getPredecessorDomainConstraints(BB, Domain);
    Domain = Domain.intersect(FromPredecessors).coalesce();
    Domain = Domain.align_params(scop->getParamSpace());

    Loop *NodeLoop = getRegionNodeLoop(Node, LI);
    const bool IsScopLoopHeader =
        NodeLoop && NodeLoop->getHeader() == BB && scop->contains(NodeLoop);
    if (IsScopLoopHeader &&
        !addLoopBoundsToHeaderDomain(NodeLoop, InvalidDomainMap))
      return false;
  }

  return true;
}


/// Propagate the domain of @p BB to the exit block of the region that @p BB
/// is the entry of, if there is such a region.
///
/// Nothing happens unless the region found for @p BB has @p BB as entry and
/// an exit block that is part of the scop. Propagation is also skipped if
/// the region contains a latch (other than @p BB itself) of @p BBLoop or of
/// any enclosing loop contained in the scop.
///
/// @param BB                 The candidate region entry block.
/// @param BBLoop             The loop surrounding @p BB (may be null).
/// @param FinishedExitBlocks Receives the exit block when its domain was set
///                           here.
/// @param InvalidDomainMap   The exit block's entry is reset to the empty
///                           set in the exit domain's space.
void ScopBuilder::propagateDomainConstraintsToRegionExit(
    BasicBlock *BB, Loop *BBLoop,
    SmallPtrSetImpl<BasicBlock *> &FinishedExitBlocks,
    DenseMap<BasicBlock *, isl::set> &InvalidDomainMap) {
  // Check if the block @p BB is the entry of a region. If so we propagate its
  // domain to the exit block of the region. Otherwise we are done.
  auto *RI = scop->getRegion().getRegionInfo();
  auto *BBReg = RI ? RI->getRegionFor(BB) : nullptr;
  auto *ExitBB = BBReg ? BBReg->getExit() : nullptr;
  if (!BBReg || BBReg->getEntry() != BB || !scop->contains(ExitBB))
    return;

  // Do not propagate the domain if there is a loop backedge inside the region
  // that would prevent the exit block from being executed. Walk from the
  // innermost loop outwards and inspect the latches of the loop currently
  // visited (L), not only those of BBLoop.
  auto *L = BBLoop;
  while (L && scop->contains(L)) {
    SmallVector<BasicBlock *, 4> LatchBBs;
    L->getLoopLatches(LatchBBs);
    for (auto *LatchBB : LatchBBs)
      if (BB != LatchBB && BBReg->contains(LatchBB))
        return;
    L = L->getParentLoop();
  }

  isl::set Domain = scop->getOrInitEmptyDomain(BB);
  assert(!Domain.is_null() && "Cannot propagate a nullptr");

  Loop *ExitBBLoop = getFirstNonBoxedLoopFor(ExitBB, LI, scop->getBoxedLoops());

  // Since the dimensions of @p BB and @p ExitBB might be different we have to
  // adjust the domain before we can propagate it.
  isl::set AdjustedDomain = adjustDomainDimensions(Domain, BBLoop, ExitBBLoop);
  isl::set &ExitDomain = scop->getOrInitEmptyDomain(ExitBB);

  // If the exit domain is not yet created we set it otherwise we "add" the
  // current domain.
  ExitDomain =
      !ExitDomain.is_null() ? AdjustedDomain.unite(ExitDomain) : AdjustedDomain;

  // Initialize the invalid domain.
  InvalidDomainMap[ExitBB] = isl::set::empty(ExitDomain.get_space());

  FinishedExitBlocks.insert(ExitBB);
}


/// Compute the union of the domains of all (non-backedge) predecessors of
/// @p BB, expressed in the dimensionality used at @p BB.
///
/// For the scop's entry block the universe in the space of @p Domain is
/// returned. If a predecessor lies in a region that has @p BB as exit, the
/// domain of that region's entry block is used instead, and further
/// predecessors inside the same region are skipped.
isl::set ScopBuilder::getPredecessorDomainConstraints(BasicBlock *BB,
                                                      isl::set Domain) {
  // The entry of the scop is not constrained by any predecessor.
  if (BB == scop->getRegion().getEntry())
    return isl::set::universe(Domain.get_space());

  // The region info of this function.
  auto &RI = *scop->getRegion().getRegionInfo();

  Loop *BBLoop = getFirstNonBoxedLoopFor(BB, LI, scop->getBoxedLoops());

  // Accumulates every condition under which BB is executed; starts empty.
  isl::set Reaching = isl::set::empty(Domain.get_space());

  // Regions whose entry domain has already been merged into Reaching.
  SmallSet<Region *, 8> CoveredRegions;

  for (auto *Pred : predecessors(BB)) {
    // Backedges do not contribute.
    if (DT.dominates(BB, Pred))
      continue;

    // A predecessor inside an already handled region adds nothing new.
    bool AlreadyCovered = false;
    for (Region *Covered : CoveredRegions) {
      if (Covered->contains(Pred)) {
        AlreadyCovered = true;
        break;
      }
    }
    if (AlreadyCovered)
      continue;

    // Look for a region that contains the predecessor and has BB as its exit
    // block, walking up the region tree until a region either exits at BB or
    // contains BB.
    // FIXME: This was an side-effect-free (and possibly infinite) loop when
    //        committed and seems not to be needed.
    auto *Candidate = RI.getRegionFor(Pred);
    while (Candidate->getExit() != BB && !Candidate->contains(BB))
      Candidate = Candidate->getParent();

    // Use the region's entry block as the source if such a region was found,
    // the predecessor itself otherwise.
    BasicBlock *Source = Pred;
    if (Candidate->getExit() == BB) {
      Source = Candidate->getEntry();
      CoveredRegions.insert(Candidate);
    }

    isl::set SourceDom = scop->getDomainConditions(Source);
    Loop *SourceLoop =
        getFirstNonBoxedLoopFor(Source, LI, scop->getBoxedLoops());
    SourceDom = adjustDomainDimensions(SourceDom, SourceLoop, BBLoop);
    Reaching = Reaching.unite(SourceDom);
  }

  return Reaching;
}


/// Restrict the domain of the header of loop @p L by the loop's bounds.
///
/// The backedge conditions of all latches with a defined domain are united.
/// Header iterations at or after a point where no backedge is taken are
/// removed, the result is shifted by one iteration, and only the part that
/// is bounded in the loop's dimension is kept as the new header domain. The
/// parameter values of the unbounded remainder are recorded as an
/// INFINITELOOP restriction.
///
/// @param L                The loop whose header domain is updated.
/// @param InvalidDomainMap Passed on to buildConditionSets.
///
/// @returns False if building the condition sets of a latch fails; true
///          otherwise.
bool ScopBuilder::addLoopBoundsToHeaderDomain(
    Loop *L, DenseMap<BasicBlock *, isl::set> &InvalidDomainMap) {
  int LoopDepth = scop->getRelativeLoopDepth(L);
  assert(LoopDepth >= 0 && "Loop in region should have at least depth one");

  BasicBlock *HeaderBB = L->getHeader();
  assert(scop->isDomainDefined(HeaderBB));
  isl::set &HeaderBBDom = scop->getOrInitEmptyDomain(HeaderBB);

  isl::map NextIterationMap =
      createNextIterationMap(HeaderBBDom.get_space(), LoopDepth);

  // Static factory, spelled through the type rather than an instance.
  isl::set UnionBackedgeCondition = isl::set::empty(HeaderBBDom.get_space());

  SmallVector<BasicBlock *, 4> LatchBlocks;
  L->getLoopLatches(LatchBlocks);

  for (BasicBlock *LatchBB : LatchBlocks) {
    // If the latch is only reachable via error statements we skip it.
    if (!scop->isDomainDefined(LatchBB))
      continue;

    isl::set LatchBBDom = scop->getDomainConditions(LatchBB);

    isl::set BackedgeCondition;

    Instruction *TI = LatchBB->getTerminator();
    BranchInst *BI = dyn_cast<BranchInst>(TI);
    assert(BI && "Only branch instructions allowed in loop latches");

    if (BI->isUnconditional())
      BackedgeCondition = LatchBBDom;
    else {
      SmallVector<isl_set *, 8> ConditionSets;
      // Index of the successor that is the loop header (0 or 1).
      int idx = BI->getSuccessor(0) != HeaderBB;
      if (!buildConditionSets(LatchBB, TI, L, LatchBBDom.get(),
                              InvalidDomainMap, ConditionSets))
        return false;

      // Free the non back edge condition set as we do not need it.
      isl_set_free(ConditionSets[1 - idx]);

      BackedgeCondition = isl::manage(ConditionSets[idx]);
    }

    // Drop the dimensions of loops nested inside L so the condition lives in
    // the header's space.
    int LatchLoopDepth = scop->getRelativeLoopDepth(LI.getLoopFor(LatchBB));
    assert(LatchLoopDepth >= LoopDepth);
    BackedgeCondition = BackedgeCondition.project_out(
        isl::dim::set, LoopDepth + 1, LatchLoopDepth - LoopDepth);
    UnionBackedgeCondition = UnionBackedgeCondition.unite(BackedgeCondition);
  }

  // Relation from an iteration to all lexicographically equal-or-later
  // iterations that agree on the outer loop dimensions. lex_le is a static
  // factory, so it is called on the type instead of on the variable being
  // initialized.
  isl::map ForwardMap = isl::map::lex_le(HeaderBBDom.get_space());
  for (int i = 0; i < LoopDepth; i++)
    ForwardMap = ForwardMap.equate(isl::dim::in, i, isl::dim::out, i);

  // Iterations (with a non-negative counter) at which no backedge is taken,
  // extended to everything that would come after them.
  isl::set UnionBackedgeConditionComplement =
      UnionBackedgeCondition.complement();
  UnionBackedgeConditionComplement =
      UnionBackedgeConditionComplement.lower_bound_si(isl::dim::set, LoopDepth,
                                                      0);
  UnionBackedgeConditionComplement =
      UnionBackedgeConditionComplement.apply(ForwardMap);
  HeaderBBDom = HeaderBBDom.subtract(UnionBackedgeConditionComplement);
  HeaderBBDom = HeaderBBDom.apply(NextIterationMap);

  // Keep only the part that is bounded in the loop dimension.
  auto Parts = partitionSetParts(HeaderBBDom, LoopDepth);
  HeaderBBDom = Parts.second;

  // Check if there is a <nsw> tagged AddRec for this loop and if so do not
  // require a runtime check. The assumption is already implied by the <nsw>
  // tag.
  bool RequiresRTC = !scop->hasNSWAddRecForLoop(L);

  isl::set UnboundedCtx = Parts.first.params();
  recordAssumption(&RecordedAssumptions, INFINITELOOP, UnboundedCtx,
                   HeaderBB->getTerminator()->getDebugLoc(), AS_RESTRICTION,
                   nullptr, RequiresRTC);
  return true;
}


void ScopBuilder::buildInvariantEquivalenceClasses() {

  DenseMap<std::pair<const SCEV *, Type *>, LoadInst *> EquivClasses;


  const InvariantLoadsSetTy &RIL = scop->getRequiredInvariantLoads();

  for (LoadInst *LInst : RIL) {

    const SCEV *PointerSCEV = SE.getSCEV(LInst->getPointerOperand());


    Type *Ty = LInst->getType();

    LoadInst *&ClassRep = EquivClasses[std::make_pair(PointerSCEV, Ty)];

    if (ClassRep) {

      scop->addInvariantLoadMapping(LInst, ClassRep);

      continue;

    }


    ClassRep = LInst;

    scop->addInvariantEquivClass(

        InvariantEquivClassTy{PointerSCEV, MemoryAccessList(), {}, Ty});

  }

}


/// Build the iteration domains for all blocks in region @p R.
///
/// The entry block receives a universe domain with one set dimension more
/// than the relative depth of its loop, and an empty invalid domain. For a
/// region that is itself a non-affine subregion only the entry block is
/// modeled and the result is whether the region is free of error blocks.
/// Otherwise the three propagation phases run in order and the first failing
/// one aborts the construction.
///
/// @param R                The region to build domains for.
/// @param InvalidDomainMap Per-block invalid domains, filled in as a side
///                         effect.
/// @returns False if any phase failed (or, for a non-affine region, if it
///          contains an error block), true otherwise.
bool ScopBuilder::buildDomains(
    Region *R, DenseMap<BasicBlock *, isl::set> &InvalidDomainMap) {
  const bool OnlyNonAffine = scop->isNonAffineSubRegion(R);
  BasicBlock *Entry = R->getEntry();

  // A non-affine region is modeled without any surrounding loop.
  Loop *EntryLoop = nullptr;
  if (!OnlyNonAffine)
    EntryLoop = LI.getLoopFor(Entry);
  int Depth = scop->getRelativeLoopDepth(EntryLoop);

  isl_space *EntrySpace =
      isl_space_set_alloc(scop->getIslCtx().get(), 0, Depth + 1);
  isl_set *Universe = isl_set_universe(EntrySpace);

  InvalidDomainMap[Entry] =
      isl::manage(isl_set_empty(isl_set_get_space(Universe)));
  isl::set EntryDomain = isl::manage(Universe);
  scop->setDomain(Entry, EntryDomain);

  if (OnlyNonAffine)
    return !containsErrorBlock(R->getNode(), *R, &SD);

  // Error blocks and blocks dominated by them have been assumed to never be
  // executed, so representing them in the Scop adds no value and is likely to
  // cause trouble while constructing ScopStmts: their contents have not been
  // verified to be expressible, and blocks dominated by them may reference
  // instructions of an unmodeled error block. The last phase therefore
  // replaces the domains of error blocks, and of blocks only reachable via
  // error blocks, with an empty set. It also records in each block's
  // InvalidDomain under which parameter combination the block would be
  // reached via an error block; load hoisting needs that information.
  return buildDomainsWithBranchConstraints(R, InvalidDomainMap) &&
         propagateDomainConstraints(R, InvalidDomainMap) &&
         propagateInvalidStmtDomains(R, InvalidDomainMap);
}


/// Compute initial domains for the blocks of @p R from branch conditions.
///
/// Starting from blocks that already have a domain, the condition sets of each
/// terminator are pushed to the successors, ignoring loop back edges.
///
/// @param R                The region to process; affine subregions are
///                         handled by recursion.
/// @param InvalidDomainMap Per-block invalid domains; an empty entry is
///                         created for every successor that receives its first
///                         domain here.
/// @returns False if a recursive call failed, if building condition sets
///          failed, or if a successor domain reached MaxDisjunctsInDomain
///          (the SCoP is then invalidated with COMPLEXITY); true otherwise.
bool ScopBuilder::buildDomainsWithBranchConstraints(
    Region *R, DenseMap<BasicBlock *, isl::set> &InvalidDomainMap) {
  // To create the domain for each block in R we iterate over all blocks and
  // subregions in R and propagate the conditions under which the current region
  // element is executed. To this end we iterate in reverse post order over R as
  // it ensures that we first visit all predecessors of a region node (either a
  // basic block or a subregion) before we visit the region node itself.
  // Initially, only the domain for the SCoP region entry block is set and from
  // there we propagate the current domain to all successors, however we add the
  // condition that the successor is actually executed next.
  // As we are only interested in non-loop carried constraints here we can
  // simply skip loop back edges.

  SmallPtrSet<BasicBlock *, 8> FinishedExitBlocks;
  ReversePostOrderTraversal<Region *> RTraversal(R);
  for (auto *RN : RTraversal) {
    // Recurse for affine subregions but go on for basic blocks and non-affine
    // subregions.
    if (RN->isSubRegion()) {
      Region *SubRegion = RN->getNodeAs<Region>();
      if (!scop->isNonAffineSubRegion(SubRegion)) {
        if (!buildDomainsWithBranchConstraints(SubRegion, InvalidDomainMap))
          return false;
        continue;
      }
    }

    // Only notify the SCoP about the error block; processing of the node
    // continues below. The lone ';' after the call is an empty statement.
    if (containsErrorBlock(RN, scop->getRegion(), &SD))
      scop->notifyErrorBlock();
    ;

    BasicBlock *BB = getRegionNodeBasicBlock(RN);
    Instruction *TI = BB->getTerminator();

    // An 'unreachable' terminator has no successors to propagate to.
    if (isa<UnreachableInst>(TI))
      continue;

    // Blocks without a domain have nothing to propagate.
    if (!scop->isDomainDefined(BB))
      continue;
    isl::set Domain = scop->getDomainConditions(BB);

    scop->updateMaxLoopDepth(unsignedFromIslSize(Domain.tuple_dim()));

    auto *BBLoop = getRegionNodeLoop(RN, LI);
    // Propagate the domain from BB directly to blocks that have a superset
    // domain, at the moment only region exit nodes of regions that start in BB.
    propagateDomainConstraintsToRegionExit(BB, BBLoop, FinishedExitBlocks,
                                           InvalidDomainMap);

    // If all successors of BB have been set a domain through the propagation
    // above we do not need to build condition sets but can just skip this
    // block. However, it is important to note that this is a local property
    // with regards to the region @p R. To this end FinishedExitBlocks is a
    // local variable.
    auto IsFinishedRegionExit = [&FinishedExitBlocks](BasicBlock *SuccBB) {
      return FinishedExitBlocks.count(SuccBB);
    };
    if (std::all_of(succ_begin(BB), succ_end(BB), IsFinishedRegionExit))
      continue;

    // Build the condition sets for the successor nodes of the current region
    // node. If it is a non-affine subregion we will always execute the single
    // exit node, hence the single entry node domain is the condition set. For
    // basic blocks we use the helper function buildConditionSets.
    //
    // ConditionSets holds raw isl_set pointers: each one is either wrapped by
    // isl::manage in the loop below or freed explicitly on the bail-out path.
    SmallVector<isl_set *, 8> ConditionSets;
    if (RN->isSubRegion())
      ConditionSets.push_back(Domain.copy());
    else if (!buildConditionSets(BB, TI, BBLoop, Domain.get(), InvalidDomainMap,
                                 ConditionSets))
      return false;

    // Now iterate over the successors and set their initial domain based on
    // their condition set. We skip back edges here and have to be careful when
    // we leave a loop not to keep constraints over a dimension that doesn't
    // exist anymore.
    assert(RN->isSubRegion() || TI->getNumSuccessors() == ConditionSets.size());
    for (unsigned u = 0, e = ConditionSets.size(); u < e; u++) {
      // From here on CondSet owns ConditionSets[u]; every 'continue' below
      // releases it through the isl::set destructor.
      isl::set CondSet = isl::manage(ConditionSets[u]);
      BasicBlock *SuccBB = getRegionNodeSuccessor(RN, TI, u);

      // Skip blocks outside the region.
      if (!scop->contains(SuccBB))
        continue;

      // If we propagate the domain of some block to "SuccBB" we do not have to
      // adjust the domain.
      if (FinishedExitBlocks.count(SuccBB))
        continue;

      // Skip back edges.
      if (DT.dominates(SuccBB, BB))
        continue;

      Loop *SuccBBLoop =
          getFirstNonBoxedLoopFor(SuccBB, LI, scop->getBoxedLoops());

      CondSet = adjustDomainDimensions(CondSet, BBLoop, SuccBBLoop);

      // Set the domain for the successor or merge it with an existing domain in
      // case there are multiple paths (without loop back edges) to the
      // successor block.
      isl::set &SuccDomain = scop->getOrInitEmptyDomain(SuccBB);

      if (!SuccDomain.is_null()) {
        SuccDomain = SuccDomain.unite(CondSet).coalesce();
      } else {
        // Initialize the invalid domain.
        InvalidDomainMap[SuccBB] = CondSet.empty(CondSet.get_space());
        SuccDomain = CondSet;
      }

      SuccDomain = SuccDomain.detect_equalities();

      // Check if the maximal number of domain disjunctions was reached.
      // In case this happens we will clean up and bail.
      if (unsignedFromIslSize(SuccDomain.n_basic_set()) < MaxDisjunctsInDomain)
        continue;

      scop->invalidate(COMPLEXITY, DebugLoc());
      // Free the condition sets that were not yet handed to isl::manage; the
      // pre-increment skips index u, which CondSet already owns.
      while (++u < ConditionSets.size())
        isl_set_free(ConditionSets[u]);
      return false;
    }
  }

  return true;
}


/// Propagate invalid domains of statements through region @p R.
///
/// Region nodes are visited in reverse post order. A node is treated as
/// invalid when it contains an error block or when its domain is a subset of
/// its invalid domain. For an invalid node the whole domain becomes the
/// invalid domain, an ERRORBLOCK restriction over the domain's parameters is
/// recorded and the domain is replaced by an empty set. A non-empty invalid
/// domain is then united into the invalid domains of all successors inside the
/// SCoP, skipping back edges.
///
/// @param R                The region to process; affine subregions are
///                         handled by recursion.
/// @param InvalidDomainMap Per-block invalid domains, updated in place.
/// @returns False if a successor's invalid domain reached
///          MaxDisjunctsInDomain (the SCoP is then invalidated with
///          COMPLEXITY), either here or in a recursively processed subregion;
///          true otherwise.
bool ScopBuilder::propagateInvalidStmtDomains(
    Region *R, DenseMap<BasicBlock *, isl::set> &InvalidDomainMap) {
  ReversePostOrderTraversal<Region *> RTraversal(R);
  for (auto *RN : RTraversal) {

    // Recurse for affine subregions but go on for basic blocks and non-affine
    // subregions.
    if (RN->isSubRegion()) {
      Region *SubRegion = RN->getNodeAs<Region>();
      if (!scop->isNonAffineSubRegion(SubRegion)) {
        // A failure inside the subregion has already invalidated the SCoP and
        // erased an entry from InvalidDomainMap, so stop instead of walking on
        // with inconsistent state.
        if (!propagateInvalidStmtDomains(SubRegion, InvalidDomainMap))
          return false;
        continue;
      }
    }

    bool ContainsErrorBlock = containsErrorBlock(RN, scop->getRegion(), &SD);
    BasicBlock *BB = getRegionNodeBasicBlock(RN);
    isl::set &Domain = scop->getOrInitEmptyDomain(BB);
    assert(!Domain.is_null() && "Cannot propagate a nullptr");

    isl::set InvalidDomain = InvalidDomainMap[BB];

    bool IsInvalidBlock = ContainsErrorBlock || Domain.is_subset(InvalidDomain);

    if (!IsInvalidBlock) {
      InvalidDomain = InvalidDomain.intersect(Domain);
    } else {
      // The whole block is invalid: remember its domain as the invalid domain,
      // record the restriction and empty the domain stored in the SCoP
      // (Domain is a reference into it).
      InvalidDomain = Domain;
      isl::set DomPar = Domain.params();
      recordAssumption(&RecordedAssumptions, ERRORBLOCK, DomPar,
                       BB->getTerminator()->getDebugLoc(), AS_RESTRICTION);
      Domain = isl::set::empty(Domain.get_space());
    }

    // Nothing to hand on to the successors.
    if (InvalidDomain.is_empty()) {
      InvalidDomainMap[BB] = InvalidDomain;
      continue;
    }

    auto *BBLoop = getRegionNodeLoop(RN, LI);
    auto *TI = BB->getTerminator();
    unsigned NumSuccs = RN->isSubRegion() ? 1 : TI->getNumSuccessors();
    for (unsigned u = 0; u < NumSuccs; u++) {
      auto *SuccBB = getRegionNodeSuccessor(RN, TI, u);

      // Skip successors outside the SCoP.
      if (!scop->contains(SuccBB))
        continue;

      // Skip backedges.
      if (DT.dominates(SuccBB, BB))
        continue;

      Loop *SuccBBLoop =
          getFirstNonBoxedLoopFor(SuccBB, LI, scop->getBoxedLoops());

      auto AdjustedInvalidDomain =
          adjustDomainDimensions(InvalidDomain, BBLoop, SuccBBLoop);

      isl::set SuccInvalidDomain = InvalidDomainMap[SuccBB];
      SuccInvalidDomain = SuccInvalidDomain.unite(AdjustedInvalidDomain);
      SuccInvalidDomain = SuccInvalidDomain.coalesce();

      InvalidDomainMap[SuccBB] = SuccInvalidDomain;

      // Check if the maximal number of domain disjunctions was reached.
      // In case this happens we will bail.
      if (unsignedFromIslSize(SuccInvalidDomain.n_basic_set()) <
          MaxDisjunctsInDomain)
        continue;

      InvalidDomainMap.erase(BB);
      scop->invalidate(COMPLEXITY, TI->getDebugLoc(), TI->getParent());
      return false;
    }

    InvalidDomainMap[BB] = InvalidDomain;
  }

  return true;
}


/// Create the memory accesses that model @p PHI.
///
/// @param PHIStmt            The statement that receives the PHI read access.
/// @param PHI                The PHI node to model.
/// @param NonAffineSubRegion If non-null, incoming edges from blocks inside
///                           this region do not get a PHI write.
/// @param IsExitBlock        True if @p PHI lives in the exit block of the
///                           region. Such a PHI is not part of the region, so
///                           only its operands coming from predecessor blocks
///                           are modeled, not the PHI itself.
void ScopBuilder::buildPHIAccesses(ScopStmt *PHIStmt, PHINode *PHI,
                                   Region *NonAffineSubRegion,
                                   bool IsExitBlock) {
  // A PHI inside the region that can be synthesized needs no accesses at all.
  // A PHI in the exit block is never skipped this way.
  if (!IsExitBlock) {
    auto *Scope = LI.getLoopFor(PHI->getParent());
    if (canSynthesize(PHI, *scop, &SE, Scope))
      return;
  }

  // The PHI is modeled as if it had been demoted before SCoP detection: it
  // loads from a fresh memory location into which every incoming block wrote
  // its value at its end.
  bool HasOperandOutsideSubRegion = false;
  for (unsigned Idx = 0; Idx < PHI->getNumIncomingValues(); ++Idx) {
    Value *Incoming = PHI->getIncomingValue(Idx);
    BasicBlock *IncomingBB = PHI->getIncomingBlock(Idx);
    ScopStmt *IncomingStmt = scop->getIncomingStmtFor(PHI->getOperandUse(Idx));

    const bool FromSubRegion =
        NonAffineSubRegion && NonAffineSubRegion->contains(IncomingBB);
    if (!FromSubRegion) {
      HasOperandOutsideSubRegion = true;
      ensurePHIWrite(PHI, IncomingStmt, IncomingBB, Incoming, IsExitBlock);
      continue;
    }

    // No PHI dependence is built inside a non-affine subregion, but a value
    // that is not an instruction of that subregion must still be made
    // available to it.
    auto *IncomingInst = dyn_cast<Instruction>(Incoming);
    const bool DefinedInSubRegion =
        IncomingInst && NonAffineSubRegion->contains(IncomingInst);
    if (!DefinedInSubRegion)
      ensureValueRead(Incoming, IncomingStmt);
  }

  if (HasOperandOutsideSubRegion && !IsExitBlock)
    addPHIReadAccess(PHIStmt, PHI);
}


/// Make every operand of @p Inst available as a value read in @p UserStmt.
///
/// Must not be called for PHI nodes.
void ScopBuilder::buildScalarDependences(ScopStmt *UserStmt,
                                         Instruction *Inst) {
  assert(!isa<PHINode>(Inst));

  // Pull in each operand the instruction uses.
  for (Use &OperandUse : Inst->operands()) {
    Value *Operand = OperandUse.get();
    ensureValueRead(Operand, UserStmt);
  }
}


// Chain two schedules one after the other. A null argument stands for the
// empty schedule, so the other argument is returned unchanged in that case;
// if both are null the result is null as well.
static isl::schedule combineInSequence(isl::schedule Prev, isl::schedule Succ) {
  const bool HavePrev = !Prev.is_null();
  const bool HaveSucc = !Succ.is_null();

  if (HavePrev && HaveSucc)
    return Prev.sequence(Succ);

  return HavePrev ? Prev : Succ;
}


// Build an isl_multi_union_pw_aff that maps every element of USet to one of
// its set dimensions.
//
// For each set in USet a projection is built that drops all dimensions from
// index N onwards; for N > 1 the first N - 1 outputs are dropped as well, so a
// single output remains. As read from these calls, N is one-based: it selects
// the dimension at zero-based index N - 1.
//
// # Example:
//
//            Domain: { A[i,j]; B[i,j,k] }
//                 N: 1
//
// Resulting Mapping: { A[i,j] -> [(i)]; B[i,j,k] -> [(i)] }
//
// @param USet   A union set describing the elements for which to generate a
//               mapping. Must be neither null nor empty.
// @param N      Selects the dimension to map to; every set in USet must have
//               at least N dimensions.
// @returns      A mapping from USet to the selected dimension.
static isl::multi_union_pw_aff mapToDimension(isl::union_set USet, unsigned N) {
  assert(!USet.is_null());
  assert(!USet.is_empty());

  auto Mapping = isl::union_pw_multi_aff::empty(USet.get_space());

  for (isl::set Part : USet.get_set_list()) {
    const unsigned NumDims = unsignedFromIslSize(Part.tuple_dim());
    assert(NumDims >= N);

    // Project out the trailing NumDims - N dimensions.
    auto Projection = isl::pw_multi_aff::project_out_map(
        Part.get_space(), isl::dim::set, N, NumDims - N);

    // Strip the leading outputs so only one is left.
    if (N > 1)
      Projection = Projection.drop_dims(isl::dim::out, 0, N - 1);

    Mapping = Mapping.add_pw_multi_aff(Projection);
  }

  return isl::multi_union_pw_aff(isl::union_pw_multi_aff(Mapping));
}


void ScopBuilder::buildSchedule() {

  Loop *L = getLoopSurroundingScop(*scop, LI);

  LoopStackTy LoopStack({LoopStackElementTy(L, {}, 0)});

  buildSchedule(scop->getRegion().getNode(), LoopStack);

  assert(LoopStack.size() == 1 && LoopStack.back().L == L);

  scop->setScheduleTree(LoopStack[0].Schedule);

}


/// Build the schedule for all region nodes in @p R.
///
/// The region is traversed in reverse post order and each region node is
/// appended, in traversal order, to the schedule of the loop on top of the
/// @p LoopStack. For loop-free code this already yields a correct sequential
/// order.
///
/// Example:
///           bb1(0)
///         /     \.
///      bb2(1)   bb3(2)
///         \    /  \.
///          bb4(3)  bb5(4)
///             \   /
///              bb6(5)
///
/// Loops need extra care. When a loop header is reached, its loop is pushed
/// onto the @p LoopStack with an empty schedule, and all region nodes inside
/// that loop have to be scheduled before any node outside of it. Reverse post
/// order alone does not guarantee this, so a node that lies outside the loop
/// on top of the @p LoopStack is put into a delay queue and only processed
/// once the nodes of the current loop are done.
void ScopBuilder::buildSchedule(Region *R, LoopStackTy &LoopStack) {
  Loop *OuterScopLoop = getLoopSurroundingScop(*scop, LI);

  ReversePostOrderTraversal<Region *> RPOT(R);
  std::deque<RegionNode *> Pending(RPOT.begin(), RPOT.end());
  std::deque<RegionNode *> Deferred;

  // Set right after a node was deferred. While it is set the next node is
  // taken from the traversal order (if one is left) instead of the deferred
  // queue, which guarantees progress. Otherwise deferred nodes are retried
  // first.
  bool JustDeferred = false;

  while (!Pending.empty() || !Deferred.empty()) {
    const bool TakePending =
        (JustDeferred && !Pending.empty()) || Deferred.empty();
    std::deque<RegionNode *> &Source = TakePending ? Pending : Deferred;

    RegionNode *Node = Source.front();
    Source.pop_front();
    if (TakePending)
      JustDeferred = false;

    // Loops outside the SCoP are all represented by the surrounding loop.
    Loop *NodeLoop = getRegionNodeLoop(Node, LI);
    if (!scop->contains(NodeLoop))
      NodeLoop = OuterScopLoop;

    Loop *TopLoop = LoopStack.back().L;
    const bool EntersOtherLoop = TopLoop != NodeLoop;

    // The node belongs to a loop that is not nested in the current one, so it
    // has to wait until the current loop is completed.
    if (EntersOtherLoop && TopLoop && !TopLoop->contains(NodeLoop)) {
      JustDeferred = true;
      Deferred.push_back(Node);
      continue;
    }

    if (EntersOtherLoop)
      LoopStack.push_back({NodeLoop, {}, 0});

    buildSchedule(Node, LoopStack);
  }
}


/// Add the statements of region node @p RN to the schedule of the innermost
/// loop on @p LoopStack and close every loop that this node completes.
///
/// An affine subregion is delegated to the Region overload. For any other
/// node, its block count is added to the innermost loop's counter and the
/// domains of its statements are appended in sequence to that loop's schedule.
///
/// @param RN        The region node to schedule.
/// @param LoopStack Stack of loops under construction; must not be empty.
///                  Completed loops are removed from it.
void ScopBuilder::buildSchedule(RegionNode *RN, LoopStackTy &LoopStack) {
  if (RN->isSubRegion()) {
    auto *LocalRegion = RN->getNodeAs<Region>();
    if (!scop->isNonAffineSubRegion(LocalRegion)) {
      buildSchedule(LocalRegion, LoopStack);
      return;
    }
  }

  assert(LoopStack.rbegin() != LoopStack.rend());
  // Reverse iterator: starts at the innermost loop and moves towards the
  // outer loops when incremented.
  auto LoopData = LoopStack.rbegin();
  LoopData->NumBlocksProcessed += getNumBlocksInRegionNode(RN);

  for (auto *Stmt : scop->getStmtListFor(RN)) {
    isl::union_set UDomain{Stmt->getDomain()};
    auto StmtSchedule = isl::schedule::from_domain(UDomain);
    LoopData->Schedule = combineInSequence(LoopData->Schedule, StmtSchedule);
  }

  // Check if we just processed the last node in this loop. If we did, finalize
  // the loop by:
  //
  //   - adding new schedule dimensions
  //   - folding the resulting schedule into the parent loop schedule
  //   - dropping the loop schedule from the LoopStack.
  //
  // Then continue to check surrounding loops, which might also have been
  // completed by this node.
  //
  // Dimension tracks how many stack elements survive; it is decremented once
  // per completed loop.
  size_t Dimension = LoopStack.size();
  while (LoopData->L &&
         LoopData->NumBlocksProcessed == getNumBlocksInLoop(LoopData->L)) {
    // Save the finished loop's data before stepping to its parent.
    isl::schedule Schedule = LoopData->Schedule;
    auto NumBlocksProcessed = LoopData->NumBlocksProcessed;

    assert(std::next(LoopData) != LoopStack.rend());
    Loop *L = LoopData->L;
    ++LoopData;
    --Dimension;

    if (!Schedule.is_null()) {
      isl::union_set Domain = Schedule.get_domain();
      isl::multi_union_pw_aff MUPA = mapToDimension(Domain, Dimension);
      Schedule = Schedule.insert_partial_schedule(MUPA);

      if (hasDisableAllTransformsHint(L)) {
        /// If any of the loops has a disable_nonforced heuristic, mark the
        /// entire SCoP as such. The ISL rescheduler can only reschedule the
        /// SCoP in its entirety.
        /// TODO: ScopDetection could avoid including such loops or wrap them as
        /// boxed loop. It still needs to pass-through loop with user-defined
        /// metadata.
        scop->markDisableHeuristics();
      }

      // It is easier to insert the marks here than do it retroactively.
      isl::id IslLoopId = createIslLoopAttr(scop->getIslCtx(), L);
      if (!IslLoopId.is_null())
        Schedule =
            Schedule.get_root().child(0).insert_mark(IslLoopId).get_schedule();

      // LoopData now refers to the parent loop.
      LoopData->Schedule = combineInSequence(LoopData->Schedule, Schedule);
    }

    // The blocks of the finished loop also count as processed for its parent.
    LoopData->NumBlocksProcessed += NumBlocksProcessed;
  }
  // Now pop all loops processed up there from the LoopStack
  LoopStack.erase(LoopStack.begin() + Dimension, LoopStack.end());
}


/// Ensure a value write exists for @p Inst if it is used outside the SCoP.
///
/// Users outside the SCoP are never iterated over, so nothing else would
/// "ensure" the write for them; the escaping use has to be detected here.
void ScopBuilder::buildEscapingDependences(Instruction *Inst) {
  if (!scop->isEscaping(Inst))
    return;

  ensureValueWrite(Inst);
}


void ScopBuilder::addRecordedAssumptions() {

  for (auto &AS : llvm::reverse(RecordedAssumptions)) {


    if (!AS.BB) {

      scop->addAssumption(AS.Kind, AS.Set, AS.Loc, AS.Sign,

                          nullptr /* BasicBlock */, AS.RequiresRTC);

      continue;

    }


    // If the domain was deleted the assumptions are void.

    isl_set *Dom = scop->getDomainConditions(AS.BB).release();

    if (!Dom)

      continue;


    // If a basic block was given use its domain to simplify the assumption.

    // In case of restrictions we know they only have to hold on the domain,

    // thus we can intersect them with the domain of the block. However, for

    // assumptions the domain has to imply them, thus:

    //                     _              _____

    //   Dom => S   <==>   A v B   <==>   A - B

    //

    // To avoid the complement we will register A - B as a restriction not an

    // assumption.

    isl_set *S = AS.Set.copy();

    if (AS.Sign == AS_RESTRICTION)

      S = isl_set_params(isl_set_intersect(S, Dom));

    else /* (AS.Sign == AS_ASSUMPTION) */

      S = isl_set_params(isl_set_subtract(Dom, S));


    scop->addAssumption(AS.Kind, isl::manage(S), AS.Loc, AS_RESTRICTION, AS.BB,

                        AS.RequiresRTC);

  }

}


/// Tighten the SCoP context with the assumptions found in @p AC.
///
/// Only single-argument calls are considered, and only if they are inside the
/// SCoP or their block satisfies scop->isDominatedBy. Assumptions whose
/// condition is not an affine constraint are skipped with an optimization
/// remark.
///
/// @param AC               The assumption cache to read from.
/// @param InvalidDomainMap Per-block invalid domains, passed through to
///                         buildConditionSets.
void ScopBuilder::addUserAssumptions(
    AssumptionCache &AC, DenseMap<BasicBlock *, isl::set> &InvalidDomainMap) {
  for (auto &Assumption : AC.assumptions()) {
    auto *CI = dyn_cast_or_null<CallInst>(Assumption);
    if (!CI || CI->arg_size() != 1)
      continue;

    bool InScop = scop->contains(CI);
    if (!InScop && !scop->isDominatedBy(DT, CI->getParent()))
      continue;

    auto *L = LI.getLoopFor(CI->getParent());
    auto *Val = CI->getArgOperand(0);
    ParameterSetTy DetectedParams;
    auto &R = scop->getRegion();
    if (!isAffineConstraint(Val, &R, L, SE, DetectedParams)) {
      ORE.emit(
          OptimizationRemarkAnalysis(DEBUG_TYPE, "IgnoreUserAssumption", CI)
          << "Non-affine user assumption ignored.");
      continue;
    }

    // Collect all newly introduced parameters.
    ParameterSetTy NewParams;
    for (auto *Param : DetectedParams) {
      Param = extractConstantFactor(Param, SE).second;
      Param = scop->getRepresentingInvariantLoadSCEV(Param);
      if (scop->isParam(Param))
        continue;
      NewParams.insert(Param);
    }

    // For an assumption inside the SCoP the condition is evaluated in the
    // domain of its own block; otherwise the SCoP context and the region
    // entry block are used and no terminator is passed.
    SmallVector<isl_set *, 2> ConditionSets;
    auto *TI = InScop ? CI->getParent()->getTerminator() : nullptr;
    BasicBlock *BB = InScop ? CI->getParent() : R.getEntry();
    auto *Dom = InScop ? isl_set_copy(scop->getDomainConditions(BB).get())
                       : isl_set_copy(scop->getContext().get());
    assert(Dom && "Cannot propagate a nullptr.");
    bool Valid = buildConditionSets(BB, Val, TI, L, Dom, InvalidDomainMap,
                                    ConditionSets);
    // Dom is a private copy made above and is released here.
    isl_set_free(Dom);

    if (!Valid)
      continue;

    // Both branches below dispose of ConditionSets[0] and ConditionSets[1]:
    // each pointer is either passed into an isl call or freed explicitly.
    isl_set *AssumptionCtx = nullptr;
    if (InScop) {
      AssumptionCtx = isl_set_complement(isl_set_params(ConditionSets[1]));
      isl_set_free(ConditionSets[0]);
    } else {
      AssumptionCtx = isl_set_complement(ConditionSets[1]);
      AssumptionCtx = isl_set_intersect(AssumptionCtx, ConditionSets[0]);
    }

    // Project out newly introduced parameters as they are not otherwise useful.
    if (!NewParams.empty()) {
      for (isl_size u = 0; u < isl_set_n_param(AssumptionCtx); u++) {
        auto *Id = isl_set_get_dim_id(AssumptionCtx, isl_dim_param, u);
        auto *Param = static_cast<const SCEV *>(isl_id_get_user(Id));
        isl_id_free(Id);

        if (!NewParams.count(Param))
          continue;

        // 'u--' steps the index back after removing parameter u, so the
        // loop's 'u++' revisits the same position on the next iteration.
        AssumptionCtx =
            isl_set_project_out(AssumptionCtx, isl_dim_param, u--, 1);
      }
    }
    ORE.emit(OptimizationRemarkAnalysis(DEBUG_TYPE, "UserAssumption", CI)
             << "Use user assumption: "
             << stringFromIslObj(AssumptionCtx, "null"));
    // isl::manage takes over AssumptionCtx.
    isl::set newContext =
        scop->getContext().intersect(isl::manage(AssumptionCtx));
    scop->setContext(newContext);
  }
}


/// Try to model @p Inst as a multi-dimensional access with fixed sizes.
///
/// The subscripts and sizes are taken from the GEP that computes the address
/// (looking through one bitcast on the address and one on the GEP base). The
/// access is only built if the GEP element size matches the accessed element
/// size, the GEP base is the SCEV base pointer, every subscript is affine and
/// only depends on required invariant loads, and at least one size was found.
///
/// @param Inst The load or store to model; other memory instructions are
///             rejected.
/// @param Stmt The statement the access is added to.
/// @returns True if an array access was added, false if this strategy does
///          not apply.
bool ScopBuilder::buildAccessMultiDimFixed(MemAccInst Inst, ScopStmt *Stmt) {
  // Memory builtins are not considered in this function.
  if (!Inst.isLoad() && !Inst.isStore())
    return false;

  Value *Val = Inst.getValueOperand();
  Type *ElementType = Val->getType();
  Value *Address = Inst.getPointerOperand();
  const SCEV *AccessFunction =
      SE.getSCEVAtScope(Address, LI.getLoopFor(Inst->getParent()));
  const SCEVUnknown *BasePointer =
      dyn_cast<SCEVUnknown>(SE.getPointerBase(AccessFunction));
  enum MemoryAccess::AccessType AccType =
      isa<LoadInst>(Inst) ? MemoryAccess::READ : MemoryAccess::MUST_WRITE;

  if (auto *BitCast = dyn_cast<BitCastInst>(Address))
    Address = BitCast->getOperand(0);

  auto *GEP = dyn_cast<GetElementPtrInst>(Address);
  if (!GEP || DL.getTypeAllocSize(GEP->getResultElementType()) !=
                  DL.getTypeAllocSize(ElementType))
    return false;

  SmallVector<const SCEV *, 4> Subscripts;
  SmallVector<int, 4> Sizes;
  getIndexExpressionsFromGEP(SE, GEP, Subscripts, Sizes);
  auto *BasePtr = GEP->getOperand(0);

  if (auto *BasePtrCast = dyn_cast<BitCastInst>(BasePtr))
    BasePtr = BasePtrCast->getOperand(0);

  // Check for identical base pointers to ensure that we do not miss index
  // offsets that have been added before this GEP is applied. The dyn_cast
  // above yields null when the pointer base is not a SCEVUnknown; treat that
  // as "strategy does not apply" instead of dereferencing a null pointer.
  if (!BasePointer || BasePtr != BasePointer->getValue())
    return false;

  std::vector<const SCEV *> SizesSCEV;

  const InvariantLoadsSetTy &ScopRIL = scop->getRequiredInvariantLoads();

  Loop *SurroundingLoop = Stmt->getSurroundingLoop();
  for (auto *Subscript : Subscripts) {
    InvariantLoadsSetTy AccessILS;
    if (!isAffineExpr(&scop->getRegion(), SurroundingLoop, Subscript, SE,
                      &AccessILS))
      return false;

    // Subscripts may only depend on loads that are already required to be
    // invariant.
    for (LoadInst *LInst : AccessILS)
      if (!ScopRIL.count(LInst))
        return false;
  }

  if (Sizes.empty())
    return false;

  // The first size entry is a null placeholder; the sizes from the GEP
  // follow as 64-bit integer constants.
  SizesSCEV.push_back(nullptr);

  for (auto V : Sizes)
    SizesSCEV.push_back(SE.getSCEV(
        ConstantInt::get(IntegerType::getInt64Ty(BasePtr->getContext()), V)));

  addArrayAccess(Stmt, Inst, AccType, BasePointer->getValue(), ElementType,
                 true, Subscripts, SizesSCEV, Val);
  return true;
}


/// Try to model @p Inst as a multi-dimensional access using the delinearized
/// shape recorded for it on the SCoP.
///
/// @param Inst The load or store to model; other memory instructions are
///             rejected.
/// @param Stmt The statement the access is added to.
/// @returns True if an array access was added, false if delinearization is
///          disabled, no delinearization data exists for @p Inst, or the data
///          holds no sizes.
bool ScopBuilder::buildAccessMultiDimParam(MemAccInst Inst, ScopStmt *Stmt) {
  // Memory builtins are not considered by this function.
  const bool IsLoadOrStore = Inst.isLoad() || Inst.isStore();
  if (!IsLoadOrStore)
    return false;

  if (!PollyDelinearize)
    return false;

  Value *Address = Inst.getPointerOperand();
  Value *Val = Inst.getValueOperand();
  Type *ElementType = Val->getType();
  unsigned ElementSize = DL.getTypeAllocSize(ElementType);
  enum MemoryAccess::AccessType AccType = MemoryAccess::MUST_WRITE;
  if (isa<LoadInst>(Inst))
    AccType = MemoryAccess::READ;

  Loop *Scope = LI.getLoopFor(Inst->getParent());
  const SCEV *AccessFunction = SE.getSCEVAtScope(Address, Scope);
  const SCEVUnknown *BasePointer =
      dyn_cast<SCEVUnknown>(SE.getPointerBase(AccessFunction));

  assert(BasePointer && "Could not find base pointer");

  auto &InsnToMemAcc = scop->getInsnToMemAccMap();
  auto AccItr = InsnToMemAcc.find(Inst);
  if (AccItr == InsnToMemAcc.end())
    return false;

  // Null placeholder first, followed by the delinearized sizes.
  std::vector<const SCEV *> Sizes;
  Sizes.push_back(nullptr);
  Sizes.insert(Sizes.end(), AccItr->second.Shape->DelinearizedSizes.begin(),
               AccItr->second.Shape->DelinearizedSizes.end());

  // With nothing but the placeholder in 'Sizes' this is not an access to a
  // real multi-dimensional array; leave it to the regular single-dimensional
  // access construction.
  if (Sizes.size() == 1)
    return false;

  // The last entry is the element size used for delinearization. It is
  // removed because the element type already conveys that information. If it
  // differs from the element size of this access the delinearization is
  // incorrect, so the scop is invalidated.
  //
  // TODO: Handle delinearization with differing element sizes.
  auto DelinearizedSize =
      cast<SCEVConstant>(Sizes.back())->getAPInt().getSExtValue();
  Sizes.pop_back();
  if (ElementSize != DelinearizedSize)
    scop->invalidate(DELINEARIZATION, Inst->getDebugLoc(), Inst->getParent());

  addArrayAccess(Stmt, Inst, AccType, BasePointer->getValue(), ElementType,
                 true, AccItr->second.DelinearizedSubscripts, Sizes, Val);
  return true;
}


/// Try to model @p Inst as a memory intrinsic.
///
/// The destination is modeled as a MUST_WRITE of i8 elements starting at the
/// destination's offset from its base pointer. For a memory transfer
/// intrinsic the source is additionally modeled as a READ in the same way.
/// If the length is not affine, or depends on a load that is not a required
/// invariant load, the accesses are built non-affine with a null length.
///
/// @param Inst The instruction to model.
/// @param Stmt The statement the accesses are added to.
/// @returns False if @p Inst is not a memory intrinsic, true otherwise (also
///          when an access is skipped because its pointer is null).
bool ScopBuilder::buildAccessMemIntrinsic(MemAccInst Inst, ScopStmt *Stmt) {
  auto *MemIntr = dyn_cast_or_null<MemIntrinsic>(Inst);
  if (!MemIntr)
    return false;

  Loop *Scope = LI.getLoopFor(Inst->getParent());
  const SCEV *LengthVal = SE.getSCEVAtScope(MemIntr->getLength(), Scope);
  assert(LengthVal);

  // Check if the length val is actually affine or if we overapproximate it
  InvariantLoadsSetTy LengthILS;
  const InvariantLoadsSetTy &RequiredILS = scop->getRequiredInvariantLoads();

  Loop *SurroundingLoop = Stmt->getSurroundingLoop();
  bool LengthIsAffine = isAffineExpr(&scop->getRegion(), SurroundingLoop,
                                     LengthVal, SE, &LengthILS);
  for (LoadInst *LInst : LengthILS) {
    if (RequiredILS.count(LInst) == 0)
      LengthIsAffine = false;
  }
  if (!LengthIsAffine)
    LengthVal = nullptr;

  // Destination: always present.
  auto *DestPtrVal = MemIntr->getDest();
  assert(DestPtrVal);

  const SCEV *DestAccFunc = SE.getSCEVAtScope(DestPtrVal, Scope);
  assert(DestAccFunc);
  // Ignore accesses to "NULL".
  // TODO: We could use this to optimize the region further, e.g., intersect
  //       the context with
  //          isl_set_complement(isl_set_params(getDomain()))
  //       as we know it would be undefined to execute this instruction anyway.
  if (DestAccFunc->isZero())
    return true;

  if (auto *DestUnknown = dyn_cast<SCEVUnknown>(DestAccFunc))
    if (isa<ConstantPointerNull>(DestUnknown->getValue()))
      return true;

  auto *DestPtrSCEV = dyn_cast<SCEVUnknown>(SE.getPointerBase(DestAccFunc));
  assert(DestPtrSCEV);
  // Turn the absolute address into an offset from the base pointer.
  DestAccFunc = SE.getMinusSCEV(DestAccFunc, DestPtrSCEV);
  addArrayAccess(Stmt, Inst, MemoryAccess::MUST_WRITE, DestPtrSCEV->getValue(),
                 IntegerType::getInt8Ty(DestPtrVal->getContext()),
                 LengthIsAffine, {DestAccFunc, LengthVal}, {nullptr},
                 Inst.getValueOperand());

  // Source: only for memory transfer intrinsics.
  auto *MemTrans = dyn_cast<MemTransferInst>(MemIntr);
  if (MemTrans == nullptr)
    return true;

  auto *SrcPtrVal = MemTrans->getSource();
  assert(SrcPtrVal);

  const SCEV *SrcAccFunc = SE.getSCEVAtScope(SrcPtrVal, Scope);
  assert(SrcAccFunc);
  // Ignore accesses to "NULL".
  // TODO: See above TODO
  if (SrcAccFunc->isZero())
    return true;

  auto *SrcPtrSCEV = dyn_cast<SCEVUnknown>(SE.getPointerBase(SrcAccFunc));
  assert(SrcPtrSCEV);
  SrcAccFunc = SE.getMinusSCEV(SrcAccFunc, SrcPtrSCEV);
  addArrayAccess(Stmt, Inst, MemoryAccess::READ, SrcPtrSCEV->getValue(),
                 IntegerType::getInt8Ty(SrcPtrVal->getContext()),
                 LengthIsAffine, {SrcAccFunc, LengthVal}, {nullptr},
                 Inst.getValueOperand());

  return true;
}


/// Model the memory effects of a call instruction.
///
/// @param Inst The instruction to inspect. Anything that is not a CallInst is
///             left to the other buildAccess* functions.
/// @param Stmt The statement that receives the created accesses.
///
/// @returns True if @p Inst is a call that has been dealt with here (this
///          includes calls for which nothing has to be modeled), false if the
///          instruction is not a call or its memory effects cannot be
///          expressed by this function.
bool ScopBuilder::buildAccessCallInst(MemAccInst Inst, ScopStmt *Stmt) {
  auto *CI = dyn_cast_or_null<CallInst>(Inst);

  if (CI == nullptr)
    return false;

  // Calls without memory effects, ignored intrinsics and debug calls need no
  // accesses at all.
  if (CI->doesNotAccessMemory() || isIgnoredIntrinsic(CI) || isDebugCall(CI))
    return true;

  // The accessed offset is unknown; a constant zero is used as a placeholder
  // subscript for the (non-affine) accesses created below.
  const SCEV *AF = SE.getConstant(IntegerType::getInt64Ty(CI->getContext()), 0);
  auto *CalledFunction = CI->getCalledFunction();
  MemoryEffects ME = AA.getMemoryEffects(CalledFunction);
  if (ME.doesNotAccessMemory())
    return true;

  if (ME.onlyAccessesArgPointees()) {
    // The callee only touches memory reachable through its pointer arguments:
    // add one access per pointer argument, a READ if the callee does not
    // modify argument memory and a MAY_WRITE otherwise.
    ModRefInfo ArgMR = ME.getModRef(IRMemLocation::ArgMem);
    auto AccType =
        !isModSet(ArgMR) ? MemoryAccess::READ : MemoryAccess::MAY_WRITE;
    Loop *L = LI.getLoopFor(Inst->getParent());
    for (const auto &Arg : CI->args()) {
      if (!Arg->getType()->isPointerTy())
        continue;

      // Null pointer arguments have no base pointer to model. Skip only this
      // argument; the remaining pointer arguments still have to be modeled,
      // otherwise their accesses would silently be dropped.
      const SCEV *ArgSCEV = SE.getSCEVAtScope(Arg, L);
      if (ArgSCEV->isZero())
        continue;

      if (auto *U = dyn_cast<SCEVUnknown>(ArgSCEV)) {
        if (isa<ConstantPointerNull>(U->getValue()))
          continue;
      }

      auto *ArgBasePtr = cast<SCEVUnknown>(SE.getPointerBase(ArgSCEV));
      addArrayAccess(Stmt, Inst, AccType, ArgBasePtr->getValue(),
                     ArgBasePtr->getType(), false, {AF}, {nullptr}, CI);
    }
    return true;
  }

  // Calls that only read (arbitrary) memory are remembered in GlobalReads.
  if (ME.onlyReadsMemory()) {
    GlobalReads.emplace_back(Stmt, CI);
    return true;
  }
  return false;
}


/// Model a load or store as an access to a one-dimensional array.
///
/// @param Inst The load/store to model; other instructions are rejected.
/// @param Stmt The statement that receives the created access.
///
/// @returns True if an access has been created, false if @p Inst is neither a
///          load nor a store.
bool ScopBuilder::buildAccessSingleDim(MemAccInst Inst, ScopStmt *Stmt) {
  // Only plain loads and stores are handled here.
  const bool IsLoadOrStore = Inst.isLoad() || Inst.isStore();
  if (!IsLoadOrStore)
    return false;

  Value *Val = Inst.getValueOperand();
  Value *Address = Inst.getPointerOperand();
  Type *ElementType = Val->getType();

  MemoryAccess::AccessType AccType = MemoryAccess::MUST_WRITE;
  if (isa<LoadInst>(Inst))
    AccType = MemoryAccess::READ;

  // Express the address as an offset relative to its base pointer.
  Loop *InstLoop = LI.getLoopFor(Inst->getParent());
  const SCEV *AccessFunction = SE.getSCEVAtScope(Address, InstLoop);
  const SCEVUnknown *BasePointer =
      dyn_cast<SCEVUnknown>(SE.getPointerBase(AccessFunction));
  assert(BasePointer && "Could not find base pointer");
  AccessFunction = SE.getMinusSCEV(AccessFunction, BasePointer);

  // An offset that varies in a loop contained in the statement itself (i.e. a
  // loop inside a non-affine subregion) cannot be treated as affine.
  SetVector<const Loop *> Loops;
  findLoops(AccessFunction, Loops);
  bool isVariantInNonAffineLoop = false;
  for (const Loop *UsedLoop : Loops) {
    if (!Stmt->contains(UsedLoop))
      continue;
    isVariantInNonAffineLoop = true;
    break;
  }

  InvariantLoadsSetTy AccessILS;
  Loop *SurroundingLoop = Stmt->getSurroundingLoop();

  bool IsAffine = false;
  if (!isVariantInNonAffineLoop)
    IsAffine = isAffineExpr(&scop->getRegion(), SurroundingLoop,
                            AccessFunction, SE, &AccessILS);

  // Every load the expression relies on must be one of the SCoP's required
  // invariant loads, otherwise the access is not affine.
  const InvariantLoadsSetTy &ScopRIL = scop->getRequiredInvariantLoads();
  for (LoadInst *Load : AccessILS) {
    if (ScopRIL.count(Load))
      continue;
    IsAffine = false;
    break;
  }

  // A write at a non-affine location can only be a may-write.
  if (AccType == MemoryAccess::MUST_WRITE && !IsAffine)
    AccType = MemoryAccess::MAY_WRITE;

  addArrayAccess(Stmt, Inst, AccType, BasePointer->getValue(), ElementType,
                 IsAffine, {AccessFunction}, {nullptr}, Val);
  return true;
}


/// Create the memory access(es) for @p Inst in @p Stmt.
///
/// The specialized builders are tried in a fixed order; the first one that
/// reports success ends the search.
void ScopBuilder::buildMemoryAccess(MemAccInst Inst, ScopStmt *Stmt) {
  // Short-circuit evaluation keeps the order and stops at the first success.
  const bool Handled = buildAccessMemIntrinsic(Inst, Stmt) ||
                       buildAccessCallInst(Inst, Stmt) ||
                       buildAccessMultiDimFixed(Inst, Stmt) ||
                       buildAccessMultiDimParam(Inst, Stmt) ||
                       buildAccessSingleDim(Inst, Stmt);
  if (Handled)
    return;

  llvm_unreachable(
      "At least one of the buildAccess functions must handled this access, or "
      "ScopDetection should have rejected this SCoP");
}


void ScopBuilder::buildAccessFunctions() {

  for (auto &Stmt : *scop) {

    if (Stmt.isBlockStmt()) {

      buildAccessFunctions(&Stmt, *Stmt.getBasicBlock());

      continue;

    }


    Region *R = Stmt.getRegion();

    for (BasicBlock *BB : R->blocks())

      buildAccessFunctions(&Stmt, *BB, R);

  }


  // Build write accesses for values that are used after the SCoP.

  // The instructions defining them might be synthesizable and therefore not

  // contained in any statement, hence we iterate over the original instructions

  // to identify all escaping values.

  for (BasicBlock *BB : scop->getRegion().blocks()) {

    for (Instruction &Inst : *BB)

      buildEscapingDependences(&Inst);

  }

}


/// Decide whether @p Inst has to be listed in a statement.
///
/// Terminators, ignored intrinsics and instructions that can be synthesized
/// in the scope of @p L are not modeled.
bool ScopBuilder::shouldModelInst(Instruction *Inst, Loop *L) {
  if (Inst->isTerminator())
    return false;
  if (isIgnoredIntrinsic(Inst))
    return false;
  return !canSynthesize(Inst, *scop, &SE, L);
}


/// Build the name of a statement derived from a basic block.
///
/// @param BB     The basic block represented by the statement.
/// @param BBIdx  Index of @p BB relative to other BBs/regions.
/// @param Count  Index of the statement among those created for @p BB.
/// @param IsMain True for the main statement of @p BB; it gets no suffix.
/// @param IsLast Marks the last statement of a BB with a dedicated suffix.
static std::string makeStmtName(BasicBlock *BB, long BBIdx, int Count,
                                bool IsMain, bool IsLast = false) {
  std::string Suffix;
  if (!IsMain) {
    // With instruction names enabled the suffix is set off by an underscore.
    if (UseInstructionNames)
      Suffix.push_back('_');

    if (IsLast)
      Suffix.append("last");
    else if (Count >= 26)
      Suffix.append(std::to_string(Count));
    else
      // Indices below 26 are encoded as the letter at offset Count from 'a'.
      Suffix.push_back(static_cast<char>('a' + Count));
  }
  return getIslCompatibleName("Stmt", BB, BBIdx, Suffix, UseInstructionNames);
}


/// Build the name of a statement that represents a non-affine subregion.
///
/// @param R    The region represented by the statement.
/// @param RIdx Index of @p R relative to other BBs/regions.
static std::string makeStmtName(Region *R, long RIdx) {
  const std::string RegionName = R->getNameStr();
  return getIslCompatibleName("Stmt", RegionName, RIdx, "",
                              UseInstructionNames);
}


/// Create the statements of @p BB by cutting its instruction sequence.
///
/// A new statement is started after every instruction carrying
/// "polly_split_after" metadata and, if @p SplitOnStore is set, after every
/// store. The trailing instructions always form a final statement.
void ScopBuilder::buildSequentialBlockStmts(BasicBlock *BB, bool SplitOnStore) {
  Loop *SurroundingLoop = LI.getLoopFor(BB);

  int Count = 0;
  long BBIdx = scop->getNextStmtIdx();
  std::vector<Instruction *> Instructions;

  // Emit a statement holding the instructions gathered so far. The first
  // statement of the block (Count == 0) is the main one.
  auto EmitStmt = [&]() {
    std::string Name = makeStmtName(BB, BBIdx, Count, Count == 0);
    scop->addScopStmt(BB, Name, SurroundingLoop, Instructions);
  };

  for (Instruction &Inst : *BB) {
    if (shouldModelInst(&Inst, SurroundingLoop))
      Instructions.push_back(&Inst);

    const bool SplitHere = Inst.getMetadata("polly_split_after") ||
                           (SplitOnStore && isa<StoreInst>(Inst));
    if (!SplitHere)
      continue;

    EmitStmt();
    Count++;
    Instructions.clear();
  }

  EmitStmt();
}


/// Tell whether @p Inst is an ordered instruction.
///
/// Unordered instructions can be permuted freely within a sequence of
/// unordered instructions without changing semantics; every instruction for
/// which this does not always hold is ordered.
static bool isOrderedInstruction(Instruction *Inst) {
  if (Inst->mayHaveSideEffects())
    return true;
  return Inst->mayReadOrWriteMemory();
}


/// Put an instruction into the same statement as the instructions whose
/// scalar results it uses.
static void joinOperandTree(EquivalenceClasses<Instruction *> &UnionFind,
                            ArrayRef<Instruction *> ModeledInsts) {
  for (Instruction *User : ModeledInsts) {
    // PHI nodes are not joined with their operands here.
    if (isa<PHINode>(User))
      continue;

    for (Use &Operand : User->operands()) {
      auto *Def = dyn_cast<Instruction>(Operand.get());

      // Only operands that are instructions known to UnionFind, i.e. modeled
      // instructions of this BB, are of interest.
      if (!Def || UnionFind.findValue(Def) == UnionFind.end())
        continue;

      UnionFind.unionSets(User, Def);
    }
  }
}


/// Keep ordered instructions in their original relative order.
///
/// Whenever an ordered instruction is enclosed by instructions of a different
/// statement (which may or may not contain ordered instructions itself; this
/// is not checked), the involved statements are joined.
static void
joinOrderedInstructions(EquivalenceClasses<Instruction *> &UnionFind,
                        ArrayRef<Instruction *> ModeledInsts) {
  SetVector<Instruction *> SeenLeaders;
  for (Instruction *Inst : ModeledInsts) {
    if (!isOrderedInstruction(Inst))
      continue;

    Instruction *Leader = UnionFind.getLeaderValue(Inst);

    // Earlier iterations may have merged sets, so some entries of SeenLeaders
    // are no longer leaders. The leader of a merged set is, however, always
    // one of the former leaders of its parts. A leader seen for the first
    // time cannot be enclosing anything yet.
    if (SeenLeaders.insert(Leader))
      continue;

    // Close the hole: having seen statements A and B in this order, another
    // instruction of A yields the pattern "A B A". Walk SeenLeaders backwards
    // and merge everything into Leader's set until Leader's own (single)
    // entry is reached. Leaders change while merging, but that is irrelevant
    // because we only search for an element known to be in the list.
    for (auto It = SeenLeaders.rbegin(), End = SeenLeaders.rend();
         It != End && *It != Leader; ++It)
      UnionFind.unionSets(*It, Leader);
  }
}


/// For a BasicBlock with an edge to itself, make sure the PHI WRITEs for the
/// values incoming from this block are executed after the PHI READ.
///
/// Otherwise the value incoming from before the BB could be overwritten with
/// the value for the next execution. That can happen when the PHI WRITE is
/// placed into the statement of the instruction defining the incoming value
/// (rather than into the last statement of the same BB). Placing PHI READ and
/// PHI WRITE into one statement fixes the order, because within a statement
/// PHI WRITEs are always executed after PHI READs.
///
/// TODO: This is an overpessimization. It suffices to guarantee that the PHI
/// WRITE is not put into a statement containing the PHI itself. This could
/// also be achieved by
/// - having all (strongly connected) PHIs in a single statement,
/// - uniting only the PHIs in the operand tree of the PHI WRITE (because it
///   only has a chance of being lifted before a PHI by being in a statement
///   with a PHI that comes before in the basic block), or
/// - when uniting statements, ensuring that no (relevant) PHIs are overtaken.
static void joinOrderedPHIs(EquivalenceClasses<Instruction *> &UnionFind,
                            ArrayRef<Instruction *> ModeledInsts) {
  for (Instruction *Inst : ModeledInsts) {
    if (auto *PHI = dyn_cast<PHINode>(Inst)) {
      // Index of the incoming edge from the PHI's own block; negative if the
      // block is not one of the PHI's incoming blocks.
      const int SelfIdx = PHI->getBasicBlockIndex(PHI->getParent());
      if (SelfIdx >= 0)
        if (auto *Def = dyn_cast<Instruction>(PHI->getIncomingValue(SelfIdx)))
          UnionFind.unionSets(PHI, Def);
    }
  }
}


/// Create the statements of @p BB from equivalence classes of its modeled
/// instructions, followed by an epilogue statement without instructions.
void ScopBuilder::buildEqivClassBlockStmts(BasicBlock *BB) {
  Loop *L = LI.getLoopFor(BB);

  // Collect the modeled instructions once so that shouldModelInst() does not
  // have to be queried again later.
  SmallVector<Instruction *, 32> ModeledInsts;
  EquivalenceClasses<Instruction *> UnionFind;
  Instruction *MainInst = nullptr;
  for (Instruction &Inst : *BB) {
    if (!shouldModelInst(&Inst, L))
      continue;
    ModeledInsts.push_back(&Inst);
    UnionFind.insert(&Inst);

    // If a BB is split into several statements, the main statement is the one
    // holding the 'main' instruction: the first instruction unlikely to be
    // removed (because it has side-effects). This guarantees that at least
    // one statement of the bb is named as with -polly-stmt-granularity=bb.
    if (MainInst)
      continue;
    const bool IsNonIntrinsicCall =
        isa<CallInst>(Inst) && !isa<IntrinsicInst>(Inst);
    if (isa<StoreInst>(Inst) || IsNonIntrinsicCall)
      MainInst = &Inst;
  }

  joinOperandTree(UnionFind, ModeledInsts);
  joinOrderedInstructions(UnionFind, ModeledInsts);
  joinOrderedPHIs(UnionFind, ModeledInsts);

  // Instruction list of every statement, keyed by the leader instruction that
  // represents the statement.
  MapVector<Instruction *, std::vector<Instruction *>> LeaderToInstList;

  // Statement order has to follow the order of the ordered instructions.
  // Without this separate pass, unordered instructions (whose order is
  // arbitrary) would take part in determining the statement order.
  for (Instruction *Inst : ModeledInsts) {
    if (!isOrderedInstruction(Inst))
      continue;

    auto LeaderIt = UnionFind.findLeader(Inst);
    if (LeaderIt != UnionFind.member_end())
      // Create the (still empty) entry for this leader.
      (void)LeaderToInstList[*LeaderIt];
  }

  // Distribute all instructions to their leaders. UnionFind's member
  // iterators are unfortunately not in any specific order.
  Instruction *MainLeader = nullptr;
  for (Instruction *Inst : ModeledInsts) {
    auto LeaderIt = UnionFind.findLeader(Inst);
    if (LeaderIt == UnionFind.member_end())
      continue;

    Instruction *Leader = *LeaderIt;
    if (Inst == MainInst)
      MainLeader = Leader;
    LeaderToInstList[Leader].push_back(Inst);
  }

  // Finally create the statements.
  int Count = 0;
  long BBIdx = scop->getNextStmtIdx();
  for (auto &LeaderAndInsts : LeaderToInstList) {
    // Without a main instruction the first statement becomes the main one.
    bool IsMain;
    if (MainInst)
      IsMain = (MainLeader == LeaderAndInsts.first);
    else
      IsMain = (Count == 0);

    std::string Name = makeStmtName(BB, BBIdx, Count, IsMain);
    scop->addScopStmt(BB, Name, L, std::move(LeaderAndInsts.second));
    ++Count;
  }

  // Always append an epilogue (last statement). It has no instructions but
  // holds the PHI write accesses for successor basic blocks whose incoming
  // value is not defined in another statement of the same BB. It becomes the
  // main statement only if no other statement could. The epilogue will be
  // removed again if no PHIWrite is added to it.
  std::string EpilogueName = makeStmtName(BB, BBIdx, Count, Count == 0, true);
  scop->addScopStmt(BB, EpilogueName, L, {});
}


/// Create the statements for region @p SR and, recursively, its subregions.
///
/// A non-affine subregion becomes a single region statement; otherwise every
/// basic block is split according to the selected statement granularity.
void ScopBuilder::buildStmts(Region &SR) {
  if (scop->isNonAffineSubRegion(&SR)) {
    // Only the modeled instructions of the entry block are listed.
    std::vector<Instruction *> Instructions;
    Loop *SurroundingLoop =
        getFirstNonBoxedLoopFor(SR.getEntry(), LI, scop->getBoxedLoops());
    for (Instruction &Inst : *SR.getEntry()) {
      if (!shouldModelInst(&Inst, SurroundingLoop))
        continue;
      Instructions.push_back(&Inst);
    }
    long RIdx = scop->getNextStmtIdx();
    std::string Name = makeStmtName(&SR, RIdx);
    scop->addScopStmt(&SR, Name, SurroundingLoop, Instructions);
    return;
  }

  for (auto I = SR.element_begin(), E = SR.element_end(); I != E; ++I) {
    if (I->isSubRegion()) {
      buildStmts(*I->getNodeAs<Region>());
      continue;
    }

    BasicBlock *BB = I->getNodeAs<BasicBlock>();
    switch (StmtGranularity) {
    case GranularityChoice::BasicBlocks:
      buildSequentialBlockStmts(BB);
      break;
    case GranularityChoice::ScalarIndependence:
      buildEqivClassBlockStmts(BB);
      break;
    case GranularityChoice::Stores:
      buildSequentialBlockStmts(BB, true);
      break;
    }
  }
}


/// Build the accesses of @p Stmt that originate from block @p BB.
///
/// @param Stmt               The statement representing @p BB.
/// @param BB                 The basic block to process.
/// @param NonAffineSubRegion Forwarded to buildPHIAccesses(); the region
///                           statement's region if there is one.
void ScopBuilder::buildAccessFunctions(ScopStmt *Stmt, BasicBlock &BB,
                                       Region *NonAffineSubRegion) {
  assert(
      Stmt &&
      "The exit BB is the only one that cannot be represented by a statement");
  assert(Stmt->represents(&BB));

  // Error blocks may contain instructions we can not model, so no access
  // functions are built for them.
  if (SD.isErrorBlock(BB, scop->getRegion()))
    return;

  auto BuildAccessesForInst = [this, Stmt,
                               NonAffineSubRegion](Instruction *Inst) {
    auto *PHI = dyn_cast<PHINode>(Inst);
    if (PHI)
      buildPHIAccesses(Stmt, PHI, NonAffineSubRegion, false);

    if (auto MemInst = MemAccInst::dyn_cast(*Inst)) {
      assert(Stmt && "Cannot build access function in non-existing statement");
      buildMemoryAccess(MemInst, Stmt);
    }

    // PHI nodes have been modeled above. Terminators outside of non-affine
    // subregions are fully modeled and regenerated from the polyhedral
    // domains, hence need no explicit data dependences.
    if (PHI)
      return;
    buildScalarDependences(Stmt, Inst);
  };

  const bool IsEntryBlock = (Stmt->getEntryBlock() == &BB);
  if (!IsEntryBlock) {
    const InvariantLoadsSetTy &RIL = scop->getRequiredInvariantLoads();
    for (Instruction &Inst : BB) {
      if (isIgnoredIntrinsic(&Inst))
        continue;

      // Invariant loads already have been processed.
      if (auto *Load = dyn_cast<LoadInst>(&Inst))
        if (RIL.count(Load))
          continue;

      BuildAccessesForInst(&Inst);
    }
    return;
  }

  // Entry block: use the statement's own instruction list; region statements
  // additionally get their entry block's terminator processed.
  for (Instruction *Inst : Stmt->getInstructions())
    BuildAccessesForInst(Inst);
  if (Stmt->isRegionStmt())
    BuildAccessesForInst(BB.getTerminator());
}


/// Create a MemoryAccess, register it with the SCoP and add it to @p Stmt.
///
/// A MUST_WRITE that is not known to be executed whenever the statement is
/// executed gets demoted to a MAY_WRITE.
///
/// @returns The newly created access.
MemoryAccess *ScopBuilder::addMemoryAccess(
    ScopStmt *Stmt, Instruction *Inst, MemoryAccess::AccessType AccType,
    Value *BaseAddress, Type *ElementType, bool Affine, Value *AccessValue,
    ArrayRef<const SCEV *> Subscripts, ArrayRef<const SCEV *> Sizes,
    MemoryKind Kind) {
  // Accesses in single-basic block statements are always executed.
  bool isKnownMustAccess = Stmt->isBlockStmt();

  // Accesses that dominate the exit block of a non-affine region are always
  // executed. In non-affine regions there may exist MemoryKind::Values that
  // do not dominate the exit. MemoryKind::Values will always dominate the
  // exit and MemoryKind::PHIs only if there is at most one PHI_WRITE in the
  // non-affine region.
  if (Stmt->isRegionStmt() && Inst &&
      DT.dominates(Inst->getParent(), Stmt->getRegion()->getExit()))
    isKnownMustAccess = true;

  // Non-affine PHI writes do not "happen" at a particular instruction, but
  // after exiting the statement. They are therefore guaranteed to execute
  // and overwrite the old value.
  const bool IsPHIKind =
      Kind == MemoryKind::PHI || Kind == MemoryKind::ExitPHI;
  if (IsPHIKind)
    isKnownMustAccess = true;

  if (AccType == MemoryAccess::MUST_WRITE && !isKnownMustAccess)
    AccType = MemoryAccess::MAY_WRITE;

  auto *Access = new MemoryAccess(Stmt, Inst, AccType, BaseAddress, ElementType,
                                  Affine, Subscripts, Sizes, AccessValue, Kind);

  scop->addAccessFunction(Access);
  Stmt->addAccess(Access);
  return Access;
}


/// Create an access of kind MemoryKind::Array and remember its base pointer.
///
/// All arguments are forwarded to addMemoryAccess(); @p BaseAddress is
/// additionally recorded in ArrayBasePointers.
void ScopBuilder::addArrayAccess(ScopStmt *Stmt, MemAccInst MemAccInst,
                                 MemoryAccess::AccessType AccType,
                                 Value *BaseAddress, Type *ElementType,
                                 bool IsAffine,
                                 ArrayRef<const SCEV *> Subscripts,
                                 ArrayRef<const SCEV *> Sizes,
                                 Value *AccessValue) {
  const MemoryKind Kind = MemoryKind::Array;

  ArrayBasePointers.insert(BaseAddress);
  addMemoryAccess(Stmt, MemAccInst, AccType, BaseAddress, ElementType, IsAffine,
                  AccessValue, Subscripts, Sizes, Kind);
}


/// Check if @p Expr is divisible by @p Size.

static bool isDivisible(const SCEV *Expr, unsigned Size, ScalarEvolution &SE) {

  assert(Size != 0);

  if (Size == 1)

    return true;


  // Only one factor needs to be divisible.

  if (auto *MulExpr = dyn_cast<SCEVMulExpr>(Expr)) {

    for (const SCEV *FactorExpr : MulExpr->operands())

      if (isDivisible(FactorExpr, Size, SE))

        return true;

    return false;

  }


  // For other n-ary expressions (Add, AddRec, Max,...) all operands need

  // to be divisible.

  if (auto *NAryExpr = dyn_cast<SCEVNAryExpr>(Expr)) {

    for (const SCEV *OpExpr : NAryExpr->operands())

      if (!isDivisible(OpExpr, Size, SE))

        return false;

    return true;

  }


  const SCEV *SizeSCEV = SE.getConstant(Expr->getType(), Size);

  const SCEV *UDivSCEV = SE.getUDivExpr(Expr, SizeSCEV);

  const SCEV *MulSCEV = SE.getMulExpr(UDivSCEV, SizeSCEV);

  return MulSCEV == Expr;

}


/// For every multi-dimensional array, look for a constant factor in the
/// accessed subscripts of the outer dimensions and, if the folding conditions
/// below hold, rewrite all accesses to the array through a map that divides
/// those subscripts by the factor, and multiply the size of the innermost
/// dimension by the factor of dimension 0.
void ScopBuilder::foldSizeConstantsToRight() {

  // Range of all access relations of the SCoP.
  isl::union_set Accessed = scop->getAccesses().range();


  for (auto Array : scop->arrays()) {

    // Nothing to fold for arrays with at most one dimension.
    if (Array->getNumberOfDimensions() <= 1)

      continue;


    isl::space Space = Array->getSpace();

    Space = Space.align_params(Accessed.get_space());


    // Skip arrays whose space does not occur in the accessed elements.
    if (!Accessed.contains(Space))

      continue;


    isl::set Elements = Accessed.extract_set(Space);

    // Map from the array space to itself; constrained per dimension below.
    isl::map Transform = isl::map::universe(Array->getSpace().map_from_set());


    // Per-dimension factor collected by the loop below (one entry per
    // dimension of Elements).
    std::vector<int> Int;

    unsigned Dims = unsignedFromIslSize(Elements.tuple_dim());

    for (unsigned i = 0; i < Dims; i++) {

      // Isolate dimension i: drop the i dimensions in front of it and the
      // Dims - i - 1 dimensions behind it, then restrict to values >= 0.
      isl::set DimOnly = isl::set(Elements).project_out(isl::dim::set, 0, i);

      DimOnly = DimOnly.project_out(isl::dim::set, 1, Dims - i - 1);

      DimOnly = DimOnly.lower_bound_si(isl::dim::set, 0, 0);


      isl::basic_set DimHull = DimOnly.affine_hull();


      // The innermost dimension is always mapped to itself with factor 1.
      if (i == Dims - 1) {

        Int.push_back(1);

        Transform = Transform.equate(isl::dim::in, i, isl::dim::out, i);

        continue;

      }


      // The hull has exactly one div: take the denominator of that div as
      // the factor of this dimension (presumably the stride of the accessed
      // values -- TODO confirm).
      if (unsignedFromIslSize(DimHull.dim(isl::dim::div)) == 1) {

        isl::aff Diff = DimHull.get_div(0);

        isl::val Val = Diff.get_denominator_val();


        // Fall back to factor 1 unless the denominator is an integer that
        // fits into a signed 32-bit value.
        int ValInt = 1;

        if (Val.is_int()) {

          auto ValAPInt = APIntFromVal(Val);

          if (ValAPInt.isSignedIntN(32))

            ValInt = ValAPInt.getSExtValue();

        } else {

        }


        Int.push_back(ValInt);

        // Equality with coefficient ValInt on out[i] and -1 on in[i] (no
        // other coefficient is set here), i.e. in[i] = ValInt * out[i].
        isl::constraint C = isl::constraint::alloc_equality(

            isl::local_space(Transform.get_space()));

        C = C.set_coefficient_si(isl::dim::out, i, ValInt);

        C = C.set_coefficient_si(isl::dim::in, i, -1);

        Transform = Transform.add_constraint(C);

        continue;

      }


      // Otherwise: factor 0 if fixing the dimension to zero does not change
      // the hull, factor 1 if it does. The dimension is mapped to itself.
      isl::basic_set ZeroSet = isl::basic_set(DimHull);

      ZeroSet = ZeroSet.fix_si(isl::dim::set, 0, 0);


      int ValInt = 1;

      if (ZeroSet.is_equal(DimHull)) {

        ValInt = 0;

      }


      Int.push_back(ValInt);

      Transform = Transform.equate(isl::dim::in, i, isl::dim::out, i);

    }


    // Give up on this array if some accessed element is outside the domain
    // of the transformation.
    isl::set MappedElements = isl::map(Transform).domain();

    if (!Elements.is_subset(MappedElements))

      continue;


    // Folding requires a factor larger than 1 in dimension 0 ...
    bool CanFold = true;

    if (Int[0] <= 1)

      CanFold = false;


    // ... and every dimension strictly between the first and the last one
    // must have either factor 0 or the same factor as dimension 0.
    unsigned NumDims = Array->getNumberOfDimensions();

    for (unsigned i = 1; i < NumDims - 1; i++)

      if (Int[0] != Int[i] && Int[i])

        CanFold = false;


    if (!CanFold)

      continue;


    // Apply the transformation to the range of every access to this array.
    for (auto &Access : scop->access_functions())

      if (Access->getScopArrayInfo() == Array)

        Access->setAccessRelation(

            Access->getAccessRelation().apply_range(Transform));


    // Rebuild the dimension sizes: all are kept, except that the innermost
    // one is multiplied by the factor of dimension 0.
    std::vector<const SCEV *> Sizes;

    for (unsigned i = 0; i < NumDims; i++) {

      auto Size = Array->getDimensionSize(i);


      if (i == NumDims - 1)

        Size = SE.getMulExpr(Size, SE.getConstant(Size->getType(), Int[0]));

      Sizes.push_back(Size);

    }


    Array->updateSizes(Sizes, false /* CheckConsistency */);

  }

}


/// Run the post-processing steps on the accesses created so far, in a fixed
/// order.
void ScopBuilder::finalizeAccesses() {

  // Pick a (virtual) element size per one-dimensional array and update the
  // dimensionality of every access.
  updateAccessDimensionality();

  // Fold constant factors found in outer array dimensions into the size of
  // the innermost dimension.
  foldSizeConstantsToRight();

  // Call foldAccessRelation() on every access.
  foldAccessRelations();

  // Record in-bounds assumptions for every access (skipped if
  // PollyIgnoreInbounds is set).
  assumeNoOutOfBounds();

}


void ScopBuilder::updateAccessDimensionality() {

  // Check all array accesses for each base pointer and find a (virtual) element

  // size for the base pointer that divides all access functions.

  for (ScopStmt &Stmt : *scop)

    for (MemoryAccess *Access : Stmt) {

      if (!Access->isArrayKind())

        continue;

      ScopArrayInfo *Array =

          const_cast<ScopArrayInfo *>(Access->getScopArrayInfo());


      if (Array->getNumberOfDimensions() != 1)

        continue;

      unsigned DivisibleSize = Array->getElemSizeInBytes();

      const SCEV *Subscript = Access->getSubscript(0);

      while (!isDivisible(Subscript, DivisibleSize, SE))

        DivisibleSize /= 2;

      auto *Ty = IntegerType::get(SE.getContext(), DivisibleSize * 8);

      Array->updateElementType(Ty);

    }


  for (auto &Stmt : *scop)

    for (auto &Access : Stmt)

      Access->updateDimensionality();

}


void ScopBuilder::foldAccessRelations() {

  for (auto &Stmt : *scop)

    for (auto &Access : Stmt)

      Access->foldAccessRelation();

}


void ScopBuilder::assumeNoOutOfBounds() {

  if (PollyIgnoreInbounds)

    return;

  for (auto &Stmt : *scop)

    for (auto &Access : Stmt) {

      isl::set Outside = Access->assumeNoOutOfBound();

      const auto &Loc = Access->getAccessInstruction()

                            ? Access->getAccessInstruction()->getDebugLoc()

                            : DebugLoc();

      recordAssumption(&RecordedAssumptions, INBOUNDS, Outside, Loc,

                       AS_ASSUMPTION);

    }

}


/// Make sure the value of @p Inst is written by the statement defining it.
void ScopBuilder::ensureValueWrite(Instruction *Inst) {
  // The statement defining Inst has to write the value so that statements
  // reading it can find it.
  ScopStmt *DefStmt = scop->getStmtFor(Inst);

  // The value may be synthesizable inside a loop (and hence be part of no
  // statement) but not after the loop, where the number of loop round-trips
  // would be needed to synthesize it. In LCSSA-form a PHI node avoids this.
  // If the IR has no such PHI, the last statement (where the value is
  // synthesizable) writes the value.
  if (DefStmt == nullptr)
    DefStmt = scop->getLastStmtFor(Inst->getParent());

  // Nothing to do if Inst is not defined within this SCoP or if the value is
  // written already.
  if (DefStmt == nullptr || DefStmt->lookupValueWriteOf(Inst))
    return;

  const ArrayRef<const SCEV *> NoSCEVs;
  addMemoryAccess(DefStmt, Inst, MemoryAccess::MUST_WRITE, Inst,
                  Inst->getType(), true, Inst, NoSCEVs, NoSCEVs,
                  MemoryKind::Value);
}


/// Make sure @p UserStmt has a read access for @p V if its use requires one.
void ScopBuilder::ensureValueRead(Value *V, ScopStmt *UserStmt) {
  // TODO: Make ScopStmt::ensureValueRead(Value*) offer the same functionality
  // to be able to replace this one. Currently, the responsibility is split:
  // first the MemoryAccess is created without its AccessRelation, which is
  // then added by ScopStmt::buildAccessRelations(). At least for scalar
  // accesses no new information becomes available in between, so the
  // AccessRelation could be created right away. This is what
  // ScopStmt::ensureValueRead(Value*) does.

  auto *Scope = UserStmt->getSurroundingLoop();
  auto VUse = VirtualUse::create(scop.get(), UserStmt, Scope, V, false);

  // Only inter-statement uses and, if requested, read-only (invariant)
  // values need a MemoryAccess; all other kinds of uses do not.
  const auto UseKind = VUse.getKind();
  const bool NeedsAccess =
      UseKind == VirtualUse::Inter ||
      (UseKind == VirtualUse::ReadOnly && ModelReadOnlyScalars);
  if (!NeedsAccess)
    return;

  // Do not create another MemoryAccess for reloading the value if one
  // already exists.
  if (UserStmt->lookupValueReadOf(V))
    return;

  const ArrayRef<const SCEV *> NoSCEVs;
  addMemoryAccess(UserStmt, nullptr, MemoryAccess::READ, V, V->getType(), true,
                  V, NoSCEVs, NoSCEVs, MemoryKind::Value);

  // Inter-statement uses need to write the value in their defining statement.
  if (VUse.isInter())
    ensureValueWrite(cast<Instruction>(V));
}


/// Make sure @p IncomingStmt writes @p IncomingValue for @p PHI.
///
/// @param PHI           The PHI node whose incoming value is written.
/// @param IncomingStmt  The statement of the incoming edge; may be null.
/// @param IncomingBlock The block the value comes from.
/// @param IncomingValue The value written for the edge.
/// @param IsExitBlock   Selects MemoryKind::ExitPHI instead of
///                      MemoryKind::PHI.
void ScopBuilder::ensurePHIWrite(PHINode *PHI, ScopStmt *IncomingStmt,
                                 BasicBlock *IncomingBlock,
                                 Value *IncomingValue, bool IsExitBlock) {
  // The incoming block might turn out to be an error statement, so make sure
  // the exit PHI SAI object exists. It is needed during code generation and
  // would be created later anyway.
  if (IsExitBlock)
    scop->getOrCreateScopArrayInfo(PHI, PHI->getType(), {},
                                   MemoryKind::ExitPHI);

  // Possible if PHI is in the SCoP's entry block: incoming blocks from
  // outside the SCoP's region have no statement representation.
  if (!IncomingStmt)
    return;

  // Make the incoming value available in the incoming block. This has to
  // precede the check for multiple PHI writes, because each of several
  // exiting edges of a subregion can carry the value effectively written by
  // the subregion; all of them must be available in the subregion statement.
  ensureValueRead(IncomingValue, IncomingStmt);

  // At most one MemoryAccess per PHINode and ScopStmt: reuse an existing
  // write, otherwise create it.
  MemoryAccess *Acc = IncomingStmt->lookupPHIWriteOf(PHI);
  if (Acc) {
    assert(Acc->getAccessInstruction() == PHI);
  } else {
    const ArrayRef<const SCEV *> NoSCEVs;
    Acc = addMemoryAccess(IncomingStmt, PHI, MemoryAccess::MUST_WRITE, PHI,
                          PHI->getType(), true, PHI, NoSCEVs, NoSCEVs,
                          IsExitBlock ? MemoryKind::ExitPHI : MemoryKind::PHI);
    assert(Acc);
  }
  Acc->addIncoming(IncomingBlock, IncomingValue);
}


/// Add a READ access of kind MemoryKind::PHI for @p PHI to @p PHIStmt.
void ScopBuilder::addPHIReadAccess(ScopStmt *PHIStmt, PHINode *PHI) {
  // Scalar accesses carry neither subscripts nor sizes.
  const ArrayRef<const SCEV *> NoSubscripts;
  const ArrayRef<const SCEV *> NoSizes;

  addMemoryAccess(PHIStmt, PHI, MemoryAccess::READ, /*BaseAddress=*/PHI,
                  /*ElementType=*/PHI->getType(), /*Affine=*/true,
                  /*AccessValue=*/PHI, NoSubscripts, NoSizes, MemoryKind::PHI);
}


/// Set the domain of @p Stmt to the SCoP's domain conditions for it, tagged
/// with a tuple id made of the statement's base name and its address.
void ScopBuilder::buildDomain(ScopStmt &Stmt) {
  isl::id StmtId =
      isl::id::alloc(scop->getIslCtx(), Stmt.getBaseName(), &Stmt);

  isl::set Conditions = scop->getDomainConditions(&Stmt);
  Stmt.Domain = Conditions.set_tuple_id(StmtId);
}


/// Record the loops surrounding @p Stmt inside the SCoP in Stmt.NestLoops,
/// ordered from the outermost to the innermost loop.
void ScopBuilder::collectSurroundingLoops(ScopStmt &Stmt) {
  BasicBlock *BB = Stmt.getEntryBlock();
  Loop *L = LI.getLoopFor(BB);

  // For region statements, skip the loops that are contained in the
  // statement's own region.
  while (L && Stmt.isRegionStmt() && Stmt.getRegion()->contains(L))
    L = L->getParentLoop();

  // Walk outwards for as long as the loop is still contained in the SCoP's
  // region; this collects the loops innermost first.
  SmallVector<llvm::Loop *, 8> Loops;
  while (L && Stmt.getParent()->getRegion().contains(L)) {
    Loops.push_back(L);
    L = L->getParentLoop();
  }

  // Insert in reverse so that NestLoops starts with the outermost loop.
  Stmt.NestLoops.insert(Stmt.NestLoops.begin(), Loops.rbegin(), Loops.rend());
}


/// Map a binary operator to the reduction type it can form.
///
/// @returns MemoryAccess::RT_NONE for a null operator, for unsupported
///          opcodes, for floating-point add/mul that is not 'fast', and for
///          multiplications if multiplicative reductions are disabled.
static MemoryAccess::ReductionType
getReductionType(const BinaryOperator *BinOp) {
  if (!BinOp)
    return MemoryAccess::RT_NONE;

  const auto Opcode = BinOp->getOpcode();

  // Floating-point additions and multiplications only qualify if 'fast'.
  const bool IsFPOp =
      Opcode == Instruction::FAdd || Opcode == Instruction::FMul;
  if (IsFPOp && !BinOp->isFast())
    return MemoryAccess::RT_NONE;

  switch (Opcode) {
  case Instruction::FAdd:
  case Instruction::Add:
    return MemoryAccess::RT_ADD;
  case Instruction::FMul:
  case Instruction::Mul:
    return DisableMultiplicativeReductions ? MemoryAccess::RT_NONE
                                           : MemoryAccess::RT_MUL;
  case Instruction::And:
    return MemoryAccess::RT_BAND;
  case Instruction::Or:
    return MemoryAccess::RT_BOR;
  case Instruction::Xor:
    return MemoryAccess::RT_BXOR;
  default:
    return MemoryAccess::RT_NONE;
  }
}


/// Combine the reduction types @p RT0 and @p RT1.
///
/// If @p RT0 is RT_BOTTOM the result is @p RT1. If both types are equal that
/// type is returned. Every other combination results in RT_NONE.
static MemoryAccess::ReductionType
combineReductionType(MemoryAccess::ReductionType RT0,
                     MemoryAccess::ReductionType RT1) {
  const bool KeepsRT1 = RT0 == MemoryAccess::RT_BOTTOM || RT0 == RT1;
  return KeepsRT1 ? RT1 : MemoryAccess::RT_NONE;
}


/// Check whether any access in @p MemAccs, except @p LoadMA and @p StoreMA,
/// touches memory in @p AllAccs.
///
/// @param AllAccs The set of accessed elements to test against.
/// @param LoadMA  Access that is excluded from the check.
/// @param StoreMA Access that is excluded from the check.
/// @param Domain  Domain the access relations in @p MemAccs are restricted to.
/// @param MemAccs The accesses to inspect.
///
/// @returns True if at least one other access, whose accessed set has the same
///          space as @p AllAccs (ignoring parameters), overlaps @p AllAccs.
bool hasIntersectingAccesses(isl::set AllAccs, MemoryAccess *LoadMA,
                             MemoryAccess *StoreMA, isl::set Domain,
                             SmallVector<MemoryAccess *, 8> &MemAccs) {
  // The parameter-free variant is only used to compare spaces.
  auto AllAccsNoParams = AllAccs.project_out_all_params();

  for (MemoryAccess *MA : MemAccs) {
    if (MA == LoadMA || MA == StoreMA)
      continue;

    auto Accs = MA->getAccessRelation().intersect_domain(Domain).range();
    auto AccsNoParams = Accs.project_out_all_params();

    // Sets that live in different spaces are not intersected at all.
    bool CompatibleSpace = AllAccsNoParams.has_equal_space(AccsNoParams);
    if (!CompatibleSpace)
      continue;

    // One overlapping access settles the answer; skip the remaining (and
    // potentially expensive) intersections.
    bool DoesIntersect = !Accs.intersect(AllAccs).is_empty();
    if (DoesIntersect)
      return true;
  }

  return false;
}


/// Test whether the accesses of @p LoadMA and @p StoreMA can form a reduction.
///
/// Three conditions are checked in order, each only if the previous one held:
/// the access relations have equal spaces, the elements read and written
/// within @p Domain overlap, and no other access in @p MemAccs touches the
/// elements accessed by the pair.
///
/// @returns True if all three conditions hold.
bool checkCandidatePairAccesses(MemoryAccess *LoadMA, MemoryAccess *StoreMA,
                                isl::set Domain,
                                SmallVector<MemoryAccess *, 8> &MemAccs) {
  isl::map LoadAccs = LoadMA->getAccessRelation();
  isl::map StoreAccs = StoreMA->getAccessRelation();

  // Step 1: both relations must live in the same space.
  const bool SameSpace = LoadAccs.has_equal_space(StoreAccs);
  POLLY_DEBUG(dbgs() << " == The accessed space below is "
                     << (SameSpace ? "" : "not ") << "equal!\n");
  POLLY_DEBUG(LoadMA->dump(); StoreMA->dump());
  if (!SameSpace)
    return false;

  // Step 2: the load and the store must actually touch common memory.
  isl::set ReadElts = LoadAccs.intersect_domain(Domain).range();
  isl::set WrittenElts = StoreAccs.intersect_domain(Domain).range();
  const bool Overlapping = !ReadElts.intersect(WrittenElts).is_empty();
  POLLY_DEBUG(dbgs() << " == The accessed memory is "
                     << (Overlapping ? "" : "not ") << "overlapping!\n");
  if (!Overlapping)
    return false;

  // Step 3: no other instruction may access the memory used by the pair.
  isl::set AllAccs =
      LoadAccs.unite(StoreAccs).intersect_domain(Domain).range();
  const bool Exclusive =
      !hasIntersectingAccesses(AllAccs, LoadMA, StoreMA, Domain, MemAccs);
  POLLY_DEBUG(dbgs() << " == The accessed memory is "
                     << (Exclusive ? "not " : "")
                     << "accessed by other instructions!\n");
  return Exclusive;
}


/// Detect reduction-like load/store pairs in @p Stmt and mark them.
///
/// The function walks all instructions in the blocks of @p Stmt that belong to
/// this statement and records, per instruction, which loads flow into it, how
/// often, and with which combined reduction type. Loads with uses that cannot
/// be tracked are collected in a set of invalid loads. Afterwards each store
/// access is paired with the loads flowing into it. A pair whose load flows in
/// exactly once with a reduction type other than RT_BOTTOM / RT_NONE and that
/// passes checkCandidatePairAccesses() becomes a candidate. Candidates whose
/// load was not invalidated are marked via markAsReductionLike().
///
/// @param Stmt The statement whose memory accesses are analyzed.
void ScopBuilder::checkForReductions(ScopStmt &Stmt) {

  // Perform a data flow analysis on the current scop statement to propagate the

  // uses of loaded values. Then check and mark the memory accesses which are

  // part of reduction like chains.

  // During the data flow analysis we use the State variable to keep track of

  // the used "load-instructions" for each instruction in the scop statement.

  // This includes the LLVM-IR of the load and the "number of uses" (or the

  // number of paths in the operand tree which end in this load).

  using StatePairTy = std::pair<unsigned, MemoryAccess::ReductionType>;

  using FlowInSetTy = MapVector<const LoadInst *, StatePairTy>;

  using StateTy = MapVector<const Instruction *, FlowInSetTy>;

  StateTy State;


  // Invalid loads are loads which have uses we can't track properly in the

  // state map. This includes loads which:

  //   o do not form a reduction when they flow into a memory location:

  //     (e.g., A[i] = B[i] * 3 and  A[i] = A[i] * A[i] + A[i])

  //   o are used by a non binary operator or one which is not commutative

  //     and associative (e.g., A[i] = A[i] % 3)

  //   o might change the control flow            (e.g., if (A[i]))

  //   o are used in indirect memory accesses     (e.g., A[B[i]])

  //   o are used outside the current scop statement

  SmallPtrSet<const Instruction *, 8> InvalidLoads;

  SmallVector<BasicBlock *, 8> ScopBlocks;

  // Scan the statement's single basic block if it has one, otherwise all
  // blocks of the statement's region.
  BasicBlock *BB = Stmt.getBasicBlock();

  if (BB)

    ScopBlocks.push_back(BB);

  else

    for (BasicBlock *Block : Stmt.getRegion()->blocks())

      ScopBlocks.push_back(Block);

  // Run the data flow analysis for all values in the scop statement

  for (BasicBlock *Block : ScopBlocks) {

    for (Instruction &Inst : *Block) {

      // Skip instructions that are modeled by a different statement.
      if ((Stmt.getParent())->getStmtFor(&Inst) != &Stmt)

        continue;

      bool UsedOutsideStmt = any_of(Inst.users(), [&Stmt](User *U) {

        return (Stmt.getParent())->getStmtFor(cast<Instruction>(U)) != &Stmt;

      });

      //  Treat loads and stores special

      if (auto *Load = dyn_cast<LoadInst>(&Inst)) {

        // Invalidate all loads used which feed into the address of this load.

        if (auto *Ptr = dyn_cast<Instruction>(Load->getPointerOperand())) {

          const auto &It = State.find(Ptr);

          if (It != State.end())

            for (const auto &FlowInSetElem : It->second)

              InvalidLoads.insert(FlowInSetElem.first);

        }


        // If this load is used outside this stmt, invalidate it.

        if (UsedOutsideStmt)

          InvalidLoads.insert(Load);


        // And indicate that this load uses itself once but without specifying

        // any reduction operator.

        State[Load].insert(

            std::make_pair(Load, std::make_pair(1, MemoryAccess::RT_BOTTOM)));

        continue;

      }


      if (auto *Store = dyn_cast<StoreInst>(&Inst)) {

        // Invalidate all loads which feed into the address of this store.

        if (const Instruction *Ptr =

                dyn_cast<Instruction>(Store->getPointerOperand())) {

          const auto &It = State.find(Ptr);

          if (It != State.end())

            for (const auto &FlowInSetElem : It->second)

              InvalidLoads.insert(FlowInSetElem.first);

        }


        // Propagate the uses of the value operand to the store

        if (auto *ValueInst = dyn_cast<Instruction>(Store->getValueOperand()))

          State.insert(std::make_pair(Store, State[ValueInst]));

        continue;

      }


      // Non load and store instructions are either binary operators or they

      // will invalidate all used loads.

      // getReductionType() returns RT_NONE for a null BinOp, i.e. for every
      // instruction that is not a binary operator.
      auto *BinOp = dyn_cast<BinaryOperator>(&Inst);

      MemoryAccess::ReductionType CurRedType = getReductionType(BinOp);

      POLLY_DEBUG(dbgs() << "CurInst: " << Inst << " RT: " << CurRedType

                         << "\n");


      // Iterate over all operands and propagate their input loads to

      // instruction.

      FlowInSetTy &InstInFlowSet = State[&Inst];

      for (Use &Op : Inst.operands()) {

        auto *OpInst = dyn_cast<Instruction>(Op);

        if (!OpInst)

          continue;


        POLLY_DEBUG(dbgs().indent(4) << "Op Inst: " << *OpInst << "\n");

        const StateTy::iterator &OpInFlowSetIt = State.find(OpInst);

        if (OpInFlowSetIt == State.end())

          continue;


        // Iterate over all the input loads of the operand and combine them

        // with the input loads of current instruction.

        FlowInSetTy &OpInFlowSet = OpInFlowSetIt->second;

        for (auto &OpInFlowPair : OpInFlowSet) {

          unsigned OpFlowIn = OpInFlowPair.second.first;

          unsigned InstFlowIn = InstInFlowSet[OpInFlowPair.first].first;


          MemoryAccess::ReductionType OpRedType = OpInFlowPair.second.second;

          MemoryAccess::ReductionType InstRedType =

              InstInFlowSet[OpInFlowPair.first].second;


          MemoryAccess::ReductionType NewRedType =

              combineReductionType(OpRedType, CurRedType);

          // A non-zero count means this load already reached the instruction
          // through an earlier operand; fold in the type recorded so far.
          if (InstFlowIn)

            NewRedType = combineReductionType(NewRedType, InstRedType);


          POLLY_DEBUG(dbgs().indent(8) << "OpRedType: " << OpRedType << "\n");

          POLLY_DEBUG(dbgs().indent(8) << "NewRedType: " << NewRedType << "\n");

          InstInFlowSet[OpInFlowPair.first] =

              std::make_pair(OpFlowIn + InstFlowIn, NewRedType);

        }

      }


      // If this operation is used outside the stmt, invalidate all the loads

      // which feed into it.

      if (UsedOutsideStmt)

        for (const auto &FlowInSetElem : InstInFlowSet)

          InvalidLoads.insert(FlowInSetElem.first);

    }

  }


  // All used loads are propagated through the whole basic block; now try to

  // find valid reduction-like candidate pairs. These load-store pairs fulfill

  // all reduction like properties with regards to only this load-store chain.

  // We later have to check if the loaded value was invalidated by an

  // instruction not in that chain.

  using MemAccPair = std::pair<MemoryAccess *, MemoryAccess *>;

  DenseMap<MemAccPair, MemoryAccess::ReductionType> ValidCandidates;


  // Iterate over all write memory accesses and check the loads flowing into

  // it for reduction candidate pairs.

  for (MemoryAccess *WriteMA : Stmt.MemAccs) {

    if (WriteMA->isRead())

      continue;

    // Only writes performed by store instructions are considered.
    StoreInst *St = dyn_cast<StoreInst>(WriteMA->getAccessInstruction());

    if (!St)

      continue;

    assert(!St->isVolatile());


    FlowInSetTy &MaInFlowSet = State[WriteMA->getAccessInstruction()];

    for (auto &MaInFlowSetElem : MaInFlowSet) {

      // NOTE(review): ReadMA is the address of the object returned by
      // getArrayAccessFor(), so the assert below presumably cannot fire.
      MemoryAccess *ReadMA = &Stmt.getArrayAccessFor(MaInFlowSetElem.first);

      assert(ReadMA && "Couldn't find memory access for incoming load!");


      POLLY_DEBUG(dbgs() << "'" << *ReadMA->getAccessInstruction()

                         << "'\n\tflows into\n'"

                         << *WriteMA->getAccessInstruction() << "'\n\t #"

                         << MaInFlowSetElem.second.first << " times & RT: "

                         << MaInFlowSetElem.second.second << "\n");


      MemoryAccess::ReductionType RT = MaInFlowSetElem.second.second;

      unsigned NumAllowableInFlow = 1;


      // We allow the load to flow in exactly once for binary reductions

      bool Valid = (MaInFlowSetElem.second.first == NumAllowableInFlow);


      // Check if we saw a valid chain of binary operators.

      Valid = Valid && RT != MemoryAccess::RT_BOTTOM;

      Valid = Valid && RT != MemoryAccess::RT_NONE;


      // Then check if the memory accesses allow a reduction.

      Valid = Valid && checkCandidatePairAccesses(

                           ReadMA, WriteMA, Stmt.getDomain(), Stmt.MemAccs);


      // Finally, mark the pair as a candidate or the load as a invalid one.

      if (Valid)

        ValidCandidates[std::make_pair(ReadMA, WriteMA)] = RT;

      else

        InvalidLoads.insert(ReadMA->getAccessInstruction());

    }

  }


  // In the last step mark the memory accesses of candidate pairs as reduction

  // like if the load wasn't marked invalid in the previous step.

  for (auto &CandidatePair : ValidCandidates) {

    MemoryAccess *LoadMA = CandidatePair.first.first;

    if (InvalidLoads.count(LoadMA->getAccessInstruction()))

      continue;

    POLLY_DEBUG(

        dbgs() << " Load :: "

               << *((CandidatePair.first.first)->getAccessInstruction())

               << "\n Store :: "

               << *((CandidatePair.first.second)->getAccessInstruction())

               << "\n are marked as reduction like\n");

    MemoryAccess::ReductionType RT = CandidatePair.second;

    CandidatePair.first.first->markAsReductionLike(RT);

    CandidatePair.first.second->markAsReductionLike(RT);

  }

}


void ScopBuilder::verifyInvariantLoads() {

  auto &RIL = scop->getRequiredInvariantLoads();

  for (LoadInst *LI : RIL) {

    assert(LI && scop->contains(LI));

    // If there exists a statement in the scop which has a memory access for

    // @p LI, then mark this scop as infeasible for optimization.

    for (ScopStmt &Stmt : *scop)

      if (Stmt.getArrayAccessOrNULLFor(LI)) {

        scop->invalidate(INVARIANTLOAD, LI->getDebugLoc(), LI->getParent());

        return;

      }

  }

}


/// Move the invariant loads of every statement from the statement to the scop.
///
/// Does nothing unless PollyInvariantLoadHoisting is enabled. For each
/// statement, all accesses for which getNonHoistableCtx() returns a non-null
/// context are collected, removed from the statement and handed to
/// addInvariantLoads().
void ScopBuilder::hoistInvariantLoads() {
  if (!PollyInvariantLoadHoisting)
    return;

  // The writes are queried once, before any access is removed.
  isl::union_map Writes = scop->getWrites();
  for (ScopStmt &Stmt : *scop) {
    InvariantAccessesTy InvariantAccesses;

    for (MemoryAccess *Access : Stmt) {
      isl::set NHCtx = getNonHoistableCtx(Access, Writes);
      if (!NHCtx.is_null())
        InvariantAccesses.push_back({Access, NHCtx});
    }

    // Transfer the memory access from the statement to the SCoP. Iterate by
    // reference so the entries (and the isl set they hold) are not copied.
    for (const auto &InvMA : InvariantAccesses)
      Stmt.removeMemoryAccess(InvMA.MA);
    addInvariantLoads(Stmt, InvariantAccesses);
  }
}


/// Decide whether an access range is too complex to be handled.
///
/// As a simple heuristic, the existentially quantified dimensions and the set
/// dimensions of all basic sets in @p AccessRange are summed up. The range is
/// considered too complex if that sum exceeds MaxDimensionsInAccessRange. This
/// catches both sets with many disjuncts and sets with many divisions, as they
/// arise in h264.
///
/// @param AccessRange The range to check for complexity.
///
/// @returns True if the access range is too complex.
static bool isAccessRangeTooComplex(isl::set AccessRange) {
  unsigned DimSum = 0;

  for (isl::basic_set Disjunct : AccessRange.get_basic_set_list()) {
    DimSum += unsignedFromIslSize(Disjunct.dim(isl::dim::div));
    DimSum += unsignedFromIslSize(Disjunct.dim(isl::dim::set));
  }

  return DimSum > MaxDimensionsInAccessRange;
}


/// Check whether the base pointer of @p MA is defined inside the scop in a way
/// that prevents hoisting.
///
/// If the scop knows an access that provides the base pointer, the result is
/// whether getNonHoistableCtx() returns a null set for that access. Otherwise
/// the result is true only if the original base address is an instruction
/// other than a load that is contained in the scop.
bool ScopBuilder::hasNonHoistableBasePtrInScop(MemoryAccess *MA,
                                               isl::union_map Writes) {
  if (auto *BasePtrMA = scop->lookupBasePtrAccess(MA))
    return getNonHoistableCtx(BasePtrMA, Writes).is_null();

  auto *BasePtrInst = dyn_cast<Instruction>(MA->getOriginalBaseAddr());
  const bool DefinedByNonLoad = BasePtrInst && !isa<LoadInst>(BasePtrInst);
  return DefinedByNonLoad && scop->contains(BasePtrInst);
}


void ScopBuilder::addUserContext() {

  if (UserContextStr.empty())

    return;


  isl::set UserContext = isl::set(scop->getIslCtx(), UserContextStr.c_str());

  isl::space Space = scop->getParamSpace();

  isl::size SpaceParams = Space.dim(isl::dim::param);

  if (unsignedFromIslSize(SpaceParams) !=

      unsignedFromIslSize(UserContext.dim(isl::dim::param))) {

    std::string SpaceStr = stringFromIslObj(Space, "null");

    errs() << "Error: the context provided in -polly-context has not the same "

           << "number of dimensions than the computed context. Due to this "

           << "mismatch, the -polly-context option is ignored. Please provide "

           << "the context in the parameter space: " << SpaceStr << ".\n";

    return;

  }


  for (auto i : rangeIslSize(0, SpaceParams)) {

    std::string NameContext =

        scop->getContext().get_dim_name(isl::dim::param, i);

    std::string NameUserContext = UserContext.get_dim_name(isl::dim::param, i);


    if (NameContext != NameUserContext) {

      std::string SpaceStr = stringFromIslObj(Space, "null");

      errs() << "Error: the name of dimension " << i

             << " provided in -polly-context "

             << "is '" << NameUserContext << "', but the name in the computed "

             << "context is '" << NameContext

             << "'. Due to this name mismatch, "

             << "the -polly-context option is ignored. Please provide "

             << "the context in the parameter space: " << SpaceStr << ".\n";

      return;

    }


    UserContext = UserContext.set_dim_id(isl::dim::param, i,

                                         Space.get_dim_id(isl::dim::param, i));

  }

  isl::set newContext = scop->getContext().intersect(UserContext);

  scop->setContext(newContext);

}


/// Compute the parameter context under which @p Access cannot be hoisted.
///
/// @param Access The access to check.
/// @param Writes The writes the access location is checked against.
///
/// @returns A null set if @p Access is not a hoisting candidate at all;
///          otherwise the context under which the loaded location is written
///          (an empty set if it is never written).
isl::set ScopBuilder::getNonHoistableCtx(MemoryAccess *Access,
                                         isl::union_map Writes) {
  // TODO: Loads that are not loop carried, hence are in a statement with
  //       zero iterators, are by construction invariant, though we
  //       currently "hoist" them anyway. This is necessary because we allow
  //       them to be treated as parameters (e.g., in conditions) and our code
  //       generation would otherwise use the old value.

  auto &Stmt = *Access->getStatement();

  // Only affine array reads that are not memory intrinsics are candidates.
  const bool IsCandidate = !Access->isScalarKind() && !Access->isWrite() &&
                           Access->isAffine() && !Access->isMemoryIntrinsic();
  if (!IsCandidate)
    return {};

  // Skip accesses that have an invariant base pointer which is defined but
  // not loaded inside the SCoP. This can happen e.g., if a readnone call
  // returns a pointer that is used as a base address. However, as we want
  // to hoist indirect pointers, we allow the base pointer to be defined in
  // the region if it is also a memory access. Each ScopArrayInfo object
  // that has a base pointer origin has a base pointer that is loaded and
  // that is invariant, thus it will be hoisted too. However, if there is
  // no base pointer origin we check that the base pointer is defined
  // outside the region.
  auto *Load = cast<LoadInst>(Access->getAccessInstruction());
  if (hasNonHoistableBasePtrInScop(Access, Writes))
    return {};

  isl::map AccessRelation = Access->getAccessRelation();
  assert(!AccessRelation.is_empty());

  // An access that depends on the statement's iterators is not invariant.
  if (AccessRelation.involves_dims(isl::dim::in, 0, Stmt.getNumIterators()))
    return {};

  AccessRelation = AccessRelation.intersect_domain(Stmt.getDomain());

  auto &DL = scop->getFunction().getDataLayout();
  const bool AlwaysSafe = isSafeToLoadUnconditionally(
      Load->getPointerOperand(), Load->getType(), Load->getAlign(), DL,
      nullptr);

  // Skip accesses in non-affine subregions as they might not be executed
  // under the same condition as the entry of the non-affine subregion.
  if (!AlwaysSafe && Stmt.getEntryBlock() != Load->getParent())
    return {};

  isl::set SafeToLoad;
  if (AlwaysSafe)
    SafeToLoad = isl::set::universe(AccessRelation.get_space().range());
  else
    SafeToLoad = AccessRelation.range();

  if (isAccessRangeTooComplex(AccessRelation.range()))
    return {};

  isl::union_map Written = Writes.intersect_range(SafeToLoad);
  isl::set WrittenCtx = Written.params();

  // Never written: the (empty) context is returned as is.
  bool IsWritten = !WrittenCtx.is_empty();
  if (!IsWritten)
    return WrittenCtx;

  WrittenCtx = WrittenCtx.remove_divs();
  const bool TooComplex =
      unsignedFromIslSize(WrittenCtx.n_basic_set()) >= MaxDisjunctsInDomain;
  if (TooComplex || !isRequiredInvariantLoad(Load))
    return {};

  // Record the context in which the location is written as a restriction.
  scop->addAssumption(INVARIANTLOAD, WrittenCtx, Load->getDebugLoc(),
                      AS_RESTRICTION, Load->getParent());
  return WrittenCtx;
}


/// Check whether @p maybeParam is one of the formal arguments of @p F.
static bool isAParameter(llvm::Value *maybeParam, const Function &F) {
  return any_of(F.args(), [maybeParam](const llvm::Argument &Arg) {
    return &Arg == maybeParam;
  });
}


/// Check whether the load of @p MA can be hoisted unconditionally.
///
/// @param MA                     The access; its instruction must be a load.
/// @param StmtInvalidCtxIsEmpty  Whether the statement's invalid context is
///                               empty.
/// @param MAInvalidCtxIsEmpty    Whether the access' invalid context is empty.
/// @param NonHoistableCtxIsEmpty Whether the non-hoistable context is empty.
///
/// @returns True if the load may be executed regardless of the statement's
///          execution context.
bool ScopBuilder::canAlwaysBeHoisted(MemoryAccess *MA,
                                     bool StmtInvalidCtxIsEmpty,
                                     bool MAInvalidCtxIsEmpty,
                                     bool NonHoistableCtxIsEmpty) {
  LoadInst *Load = cast<LoadInst>(MA->getAccessInstruction());
  Value *Ptr = Load->getPointerOperand();

  // Optionally, every function parameter is assumed to be dereferenceable.
  if (PollyAllowDereferenceOfAllFunctionParams &&
      isAParameter(Ptr, scop->getFunction()))
    return true;

  // TODO: We can provide more information for better but more expensive
  //       results.
  const DataLayout &DL = Load->getDataLayout();
  const bool Dereferenceable = isDereferenceableAndAlignedPointer(
      Ptr, Load->getType(), Load->getAlign(), DL);

  // If the location might be overwritten we do not hoist it unconditionally.
  //
  // TODO: This is probably too conservative.
  if (!Dereferenceable || !NonHoistableCtxIsEmpty)
    return false;

  // A dereferenceable load in a precisely modeled statement can be hoisted.
  if (StmtInvalidCtxIsEmpty && MAInvalidCtxIsEmpty)
    return true;

  // Even if the statement is not modeled precisely we can hoist the load if it
  // does not involve any parameters that might have been specialized by the
  // statement domain, i.e. if all subscripts are constants.
  return all_of(MA->subscripts(), [](const SCEV *Subscript) {
    return isa<SCEVConstant>(Subscript);
  });
}


/// Register the invariant accesses @p InvMAs of @p Stmt with the scop.
///
/// For each access an execution context is computed. The access is then either
/// merged into an existing invariant equivalence class (same pointer SCEV,
/// same type and same accessed range as the class' front access) or placed
/// into a newly created class. If the parameter context of the statement's
/// domain has at least MaxDisjunctsInDomain basic sets, the scop is
/// invalidated with COMPLEXITY and nothing is registered.
///
/// @param Stmt   The statement the accesses belong to.
/// @param InvMAs The invariant accesses together with their non-hoistable
///               contexts.
void ScopBuilder::addInvariantLoads(ScopStmt &Stmt,

                                    InvariantAccessesTy &InvMAs) {

  if (InvMAs.empty())

    return;


  isl::set StmtInvalidCtx = Stmt.getInvalidContext();

  bool StmtInvalidCtxIsEmpty = StmtInvalidCtx.is_empty();


  // Get the context under which the statement is executed but remove the error

  // context under which this statement is reached.

  isl::set DomainCtx = Stmt.getDomain().params();

  DomainCtx = DomainCtx.subtract(StmtInvalidCtx);


  if (unsignedFromIslSize(DomainCtx.n_basic_set()) >= MaxDisjunctsInDomain) {

    // The first invariant access provides the location for the diagnostic.
    auto *AccInst = InvMAs.front().MA->getAccessInstruction();

    scop->invalidate(COMPLEXITY, AccInst->getDebugLoc(), AccInst->getParent());

    return;

  }


  // Project out all parameters that relate to loads in the statement. Otherwise

  // we could have cyclic dependences on the constraints under which the

  // hoisted loads are executed and we could not determine an order in which to

  // pre-load them. This happens because not only lower bounds are part of the

  // domain but also upper bounds.

  for (auto &InvMA : InvMAs) {

    auto *MA = InvMA.MA;

    Instruction *AccInst = MA->getAccessInstruction();

    if (SE.isSCEVable(AccInst->getType())) {

      SetVector<Value *> Values;

      for (const SCEV *Parameter : scop->parameters()) {

        Values.clear();

        findValues(Parameter, SE, Values);

        // Only parameters whose collected values include this load matter.
        if (!Values.count(AccInst))

          continue;


        isl::id ParamId = scop->getIdForParam(Parameter);

        if (!ParamId.is_null()) {

          int Dim = DomainCtx.find_dim_by_id(isl::dim::param, ParamId);

          if (Dim >= 0)

            DomainCtx = DomainCtx.eliminate(isl::dim::param, Dim, 1);

        }

      }

    }

  }


  for (auto &InvMA : InvMAs) {

    auto *MA = InvMA.MA;

    isl::set NHCtx = InvMA.NonHoistableCtx;


    // Check for another invariant access that accesses the same location as

    // MA and if found consolidate them. Otherwise create a new equivalence

    // class at the end of InvariantEquivClasses.

    LoadInst *LInst = cast<LoadInst>(MA->getAccessInstruction());

    Type *Ty = LInst->getType();

    const SCEV *PointerSCEV = SE.getSCEV(LInst->getPointerOperand());


    isl::set MAInvalidCtx = MA->getInvalidContext();

    bool NonHoistableCtxIsEmpty = NHCtx.is_empty();

    bool MAInvalidCtxIsEmpty = MAInvalidCtx.is_empty();


    isl::set MACtx;

    // Check if we know that this pointer can be speculatively accessed.

    if (canAlwaysBeHoisted(MA, StmtInvalidCtxIsEmpty, MAInvalidCtxIsEmpty,

                           NonHoistableCtxIsEmpty)) {

      MACtx = isl::set::universe(DomainCtx.get_space());

    } else {

      // Otherwise restrict the load to the statement's context minus the
      // invalid and non-hoistable contexts.
      MACtx = DomainCtx;

      MACtx = MACtx.subtract(MAInvalidCtx.unite(NHCtx));

      MACtx = MACtx.gist_params(scop->getContext());

    }


    bool Consolidated = false;

    for (auto &IAClass : scop->invariantEquivClasses()) {

      if (PointerSCEV != IAClass.IdentifyingPointer || Ty != IAClass.AccessType)

        continue;


      // If the pointer and the type is equal check if the access function wrt.

      // to the domain is equal too. It can happen that the domain fixes

      // parameter values and these can be different for distinct part of the

      // SCoP. If this happens we cannot consolidate the loads but need to

      // create a new invariant load equivalence class.

      auto &MAs = IAClass.InvariantAccesses;

      if (!MAs.empty()) {

        // New accesses are pushed to the front below, so front() is the access
        // that was added to this class most recently.
        auto *LastMA = MAs.front();


        isl::set AR = MA->getAccessRelation().range();

        isl::set LastAR = LastMA->getAccessRelation().range();

        bool SameAR = AR.is_equal(LastAR);


        if (!SameAR)

          continue;

      }


      // Add MA to the list of accesses that are in this class.

      MAs.push_front(MA);


      Consolidated = true;


      // Unify the execution context of the class and this statement.

      isl::set IAClassDomainCtx = IAClass.ExecutionContext;

      if (!IAClassDomainCtx.is_null())

        IAClassDomainCtx = IAClassDomainCtx.unite(MACtx).coalesce();

      else

        IAClassDomainCtx = MACtx;

      IAClass.ExecutionContext = IAClassDomainCtx;

      break;

    }


    if (Consolidated)

      continue;


    MACtx = MACtx.coalesce();


    // If we did not consolidate MA, thus did not find an equivalence class

    // for it, we create a new one.

    scop->addInvariantEquivClass(

        InvariantEquivClassTy{PointerSCEV, MemoryAccessList{MA}, MACtx, Ty});

  }

}


/// Find the canonical scop array info object for a list of invariant-load
/// hoisted accesses.
///
/// The canonical array is the array info of kind MemoryKind::Array that @p S
/// knows for the access instruction of the first access in @p Accesses for
/// which such an array info exists.
///
/// @returns The canonical array, or nullptr if no access has one.
static const ScopArrayInfo *findCanonicalArray(Scop &S,
                                               MemoryAccessList &Accesses) {
  for (MemoryAccess *Access : Accesses)
    if (const ScopArrayInfo *SAI = S.getScopArrayInfoOrNull(
            Access->getAccessInstruction(), MemoryKind::Array))
      return SAI;

  return nullptr;
}


/// Check if @p Array serves as base array in an invariant load.
///
/// @returns True if any access in any invariant equivalence class of @p S
///          refers to @p Array as its scop array info.
static bool isUsedForIndirectHoistedLoad(Scop &S, const ScopArrayInfo *Array) {
  auto RefersToArray = [Array](MemoryAccess *Access) {
    return Access->getScopArrayInfo() == Array;
  };

  for (InvariantEquivClassTy &EqClass : S.getInvariantAccesses())
    if (any_of(EqClass.InvariantAccesses, RefersToArray))
      return true;

  return false;
}


/// Redirect every memory access in @p S that currently refers to the array
/// @p Old so that it refers to the array @p New instead.
///
/// This is done by replacing the output tuple id of the access relation with
/// the base pointer id of @p New.
static void replaceBasePtrArrays(Scop &S, const ScopArrayInfo *Old,
                                 const ScopArrayInfo *New) {
  for (ScopStmt &Stmt : S) {
    for (MemoryAccess *Access : Stmt) {
      if (Access->getLatestScopArrayInfo() == Old) {
        isl::id NewArrayId = New->getBasePtrId();
        isl::map Retargeted =
            Access->getAccessRelation().set_tuple_id(isl::dim::out, NewArrayId);
        Access->setAccessRelation(Retargeted);
      }
    }
  }
}


/// Make accesses whose base pointers stem from the same invariant equivalence
/// class use one canonical array.
///
/// For each class with a canonical array, every other compatible array that is
/// based on a load of the class is replaced by the canonical one in all memory
/// accesses of the scop.
void ScopBuilder::canonicalizeDynamicBasePtrs() {
  for (InvariantEquivClassTy &EqClass : scop->InvariantEquivClasses) {
    MemoryAccessList &ClassAccesses = EqClass.InvariantAccesses;

    const ScopArrayInfo *Canonical = findCanonicalArray(*scop, ClassAccesses);
    if (!Canonical)
      continue;

    for (MemoryAccess *ClassAccess : ClassAccesses) {
      const ScopArrayInfo *Candidate = scop->getScopArrayInfoOrNull(
          ClassAccess->getAccessInstruction(), MemoryKind::Array);

      const bool Replaceable = Candidate && Candidate != Canonical &&
                               Candidate->isCompatibleWith(Canonical);

      // We currently do not canonicalize arrays where some accesses are
      // hoisted as invariant loads. If we would, we need to update the access
      // function of the invariant loads as well. However, as this is not a
      // very common situation, we leave this for now to avoid further
      // complexity increases.
      if (Replaceable && !isUsedForIndirectHoistedLoad(*scop, Candidate))
        replaceBasePtrArrays(*scop, Candidate, Canonical);
    }
  }
}


/// Build the access relation of every memory access in @p Stmt.
///
/// For each access the matching ScopArrayInfo is looked up or created, the
/// piecewise affine functions for its sizes and (for affine accesses) its
/// subscripts are requested from the scop, the access relation is built and
/// the access is registered with the scop.
void ScopBuilder::buildAccessRelations(ScopStmt &Stmt) {
  for (MemoryAccess *Access : Stmt.MemAccs) {
    Type *ElementType = Access->getElementType();

    // Everything that is neither a PHI, an exit PHI nor a value is an array.
    MemoryKind Kind = MemoryKind::Array;
    if (Access->isPHIKind())
      Kind = MemoryKind::PHI;
    else if (Access->isExitPHIKind())
      Kind = MemoryKind::ExitPHI;
    else if (Access->isValueKind())
      Kind = MemoryKind::Value;

    // Create isl::pw_aff for SCEVs which describe sizes. Collect all
    // assumptions which are taken. isl::pw_aff objects are cached internally
    // and they are used later by scop.
    for (const SCEV *Size : Access->Sizes)
      if (Size)
        scop->getPwAff(Size, nullptr, false, &RecordedAssumptions);

    auto *SAI = scop->getOrCreateScopArrayInfo(Access->getOriginalBaseAddr(),
                                               ElementType, Access->Sizes, Kind);

    // Create isl::pw_aff for SCEVs which describe subscripts. Collect all
    // assumptions which are taken. isl::pw_aff objects are cached internally
    // and they are used later by scop.
    for (const SCEV *Subscript : Access->subscripts()) {
      const bool Usable = Access->isAffine() && Subscript;
      if (Usable)
        scop->getPwAff(Subscript, Stmt.getEntryBlock(), false,
                       &RecordedAssumptions);
    }

    Access->buildAccessRelation(SAI);
    scop->addAccessData(Access);
  }
}


/// Append the minimal and maximal access of @p Set to @p MinMaxAccesses.
///
/// @param Set            The set of accessed elements.
/// @param MinMaxAccesses The vector the (min, max) pair is appended to.
/// @param S              The scop; not used by this function.
///
/// @return True if more accesses should be added, false if we reached the
///         maximal number of run-time checks to be generated.
static bool buildMinMaxAccess(isl::set Set,
                              Scop::MinMaxVectorTy &MinMaxAccesses, Scop &S) {
  Set = Set.remove_divs();
  polly::simplify(Set);

  // Over-approximate sets that consist of too many disjuncts.
  if (unsignedFromIslSize(Set.n_basic_set()) > RunTimeChecksMaxAccessDisjuncts)
    Set = Set.simple_hull();

  // Restrict the number of parameters involved in the access as the lexmin/
  // lexmax computation will take too long if this number is high.
  //
  // Experiments with a simple test case using an i7 4800MQ:
  //
  //  #Parameters involved | Time (in sec)
  //            6          |     0.01
  //            7          |     0.04
  //            8          |     0.12
  //            9          |     0.40
  //           10          |     1.54
  //           11          |     6.78
  //           12          |    30.38
  //
  if (isl_set_n_param(Set.get()) >
      static_cast<isl_size>(RunTimeChecksMaxParameters)) {
    unsigned NumInvolved = 0;
    for (unsigned Idx = 0, End = isl_set_n_param(Set.get()); Idx < End; Idx++)
      if (Set.involves_dims(isl::dim::param, Idx, 1))
        NumInvolved++;

    if (NumInvolved > RunTimeChecksMaxParameters)
      return false;
  }

  isl::pw_multi_aff MinPMA = Set.lexmin_pw_multi_aff();
  isl::pw_multi_aff MaxPMA = Set.lexmax_pw_multi_aff();

  MinPMA = MinPMA.coalesce();
  MaxPMA = MaxPMA.coalesce();

  if (MaxPMA.is_null())
    return false;

  const unsigned MaxOutputSize = unsignedFromIslSize(MaxPMA.dim(isl::dim::out));

  // Adjust the last dimension of the maximal access by one as we want to
  // enclose the accessed memory region by MinPMA and MaxPMA. The pointer
  // we test during code generation might now point after the end of the
  // allocated array but we will never dereference it anyway.
  assert(MaxOutputSize >= 1 && "Assumed at least one output dimension");

  const unsigned LastDim = MaxOutputSize - 1;
  isl::pw_aff LastDimAff = MaxPMA.at(LastDim);
  isl::aff OneAff = isl::aff(isl::local_space(LastDimAff.get_domain_space()));
  OneAff = OneAff.add_constant_si(1);
  MaxPMA = MaxPMA.set_pw_aff(LastDim, LastDimAff.add(OneAff));

  if (MinPMA.is_null() || MaxPMA.is_null())
    return false;

  MinMaxAccesses.push_back(std::make_pair(MinPMA, MaxPMA));
  return true;
}


/// Compute the minimal/maximal accessed locations for the accesses in
/// @p AliasGroup.
///
/// The access relations of all group members are united, restricted to the
/// statement domains of the SCoP, and the resulting sets of accessed locations
/// are handed one at a time to buildMinMaxAccess, which appends its results to
/// @p MinMaxAccesses.
///
/// @param AliasGroup     The memory accesses to summarize.
/// @param MinMaxAccesses Output vector receiving the (min, max) pairs.
///
/// @returns True if every location set was processed successfully; false as
///          soon as buildMinMaxAccess rejects one of them (later sets are not
///          processed in that case).
bool ScopBuilder::calculateMinMaxAccess(AliasGroupTy AliasGroup,
                                        Scop::MinMaxVectorTy &MinMaxAccesses) {
  MinMaxAccesses.reserve(AliasGroup.size());

  isl::union_set StmtDomains = scop->getDomains();

  // Collect the access relations of all members into a single union map.
  isl::union_map AllAccesses = isl::union_map::empty(scop->getIslCtx());
  for (MemoryAccess *Access : AliasGroup)
    AllAccesses = AllAccesses.unite(Access->getAccessRelation());

  // Only locations reachable from the statement domains are of interest.
  isl::union_set AccessedLocations =
      AllAccesses.intersect_domain(StmtDomains).range();

  for (isl::set LocationSet : AccessedLocations.get_set_list())
    if (!buildMinMaxAccess(LocationSet, MinMaxAccesses, *scop))
      return false;

  return true;
}


/// Return the domain of the statement containing @p MA with all of its set
/// dimensions projected out and its tuple id reset.
static isl::set getAccessDomain(MemoryAccess *MA) {
  isl::set StmtDomain = MA->getStatement()->getDomain();
  const unsigned NumSetDims = unsignedFromIslSize(StmtDomain.tuple_dim());
  return StmtDomain.project_out(isl::dim::set, 0, NumSetDims).reset_tuple_id();
}


/// Build the run-time alias checks for the current SCoP.
///
/// @returns True if run-time alias checks are disabled or the alias groups
///          were built successfully; false if building them failed, in which
///          case the SCoP has been invalidated.
bool ScopBuilder::buildAliasChecks() {
  if (!PollyUseRuntimeAliasChecks)
    return true;

  if (!buildAliasGroups()) {
    // The alias groups could not be built: dismiss this SCoP and pretend it
    // was never valid by making the assumed context infeasible.
    scop->invalidate(ALIASING, DebugLoc());

    POLLY_DEBUG(dbgs() << "\n\nNOTE: Run time checks for " << scop->getNameStr()
                       << " could not be created. This SCoP has been dismissed.");
    return false;
  }

  // Aliasing assumptions bypass addAssumption, so the statistic is updated
  // explicitly here.
  if (!scop->getAliasGroups().empty())
    Scop::incrementNumberOfAliasingAssumptions(1);

  return true;
}


/// Group the array accesses of the SCoP by the alias sets computed by the
/// alias analysis.
///
/// Every non-scalar memory access of a statement with a non-empty domain is
/// added to an AliasSetTracker. Each resulting alias set that is neither
/// must-alias nor forwarding and that contains at least two pointers becomes
/// one alias group.
///
/// @returns A tuple of
///          - the alias groups (one vector of MemoryAccess pointers each), and
///          - the set of arrays that have at least one non-read access.
std::tuple<ScopBuilder::AliasGroupVectorTy, DenseSet<const ScopArrayInfo *>>
ScopBuilder::buildAliasGroupsForAccesses() {
  BatchAAResults BAA(AA);
  AliasSetTracker AST(BAA);

  // Maps the pointer registered with the tracker back to its MemoryAccess.
  // If several accesses share a pointer, the one visited last wins.
  DenseMap<Value *, MemoryAccess *> PtrToAcc;
  DenseSet<const ScopArrayInfo *> HasWriteAccess;
  for (ScopStmt &Stmt : *scop) {
    // Statements with an empty domain will never be executed.
    if (Stmt.getDomain().is_empty())
      continue;

    for (MemoryAccess *MA : Stmt) {
      if (MA->isScalarKind())
        continue;
      if (!MA->isRead())
        HasWriteAccess.insert(MA->getScopArrayInfo());
      MemAccInst Acc(MA->getAccessInstruction());
      // The read side of a memory transfer is keyed by the transfer's raw
      // source; every other access by its pointer operand.
      if (MA->isRead() && isa<MemTransferInst>(Acc))
        PtrToAcc[cast<MemTransferInst>(Acc)->getRawSource()] = MA;
      else
        PtrToAcc[Acc.getPointerOperand()] = MA;
      AST.add(Acc);
    }
  }

  AliasGroupVectorTy AliasGroups;
  for (AliasSet &AS : AST) {
    if (AS.isMustAlias() || AS.isForwardingAliasSet())
      continue;
    AliasGroupTy AG;
    for (const Value *Ptr : AS.getPointers())
      AG.push_back(PtrToAcc[const_cast<Value *>(Ptr)]);
    if (AG.size() < 2)
      continue;
    AliasGroups.push_back(std::move(AG));
  }

  // Both containers are locals that die here; move them into the result
  // instead of deep-copying them.
  return std::make_tuple(std::move(AliasGroups), std::move(HasWriteAccess));
}


bool ScopBuilder::buildAliasGroups() {

  // To create sound alias checks we perform the following steps:

  //   o) We partition each group into read only and non read only accesses.

  //   o) For each group with more than one base pointer we then compute minimal

  //      and maximal accesses to each array of a group in read only and non

  //      read only partitions separately.

  AliasGroupVectorTy AliasGroups;

  DenseSet<const ScopArrayInfo *> HasWriteAccess;


  std::tie(AliasGroups, HasWriteAccess) = buildAliasGroupsForAccesses();


  splitAliasGroupsByDomain(AliasGroups);


  for (AliasGroupTy &AG : AliasGroups) {

    if (!scop->hasFeasibleRuntimeContext())

      return false;


    {

      IslMaxOperationsGuard MaxOpGuard(scop->getIslCtx().get(), OptComputeOut);

      bool Valid = buildAliasGroup(AG, HasWriteAccess);

      if (!Valid)

        return false;

    }

    if (isl_ctx_last_error(scop->getIslCtx().get()) == isl_error_quota) {

      scop->invalidate(COMPLEXITY, DebugLoc());

      return false;

    }

  }


  return true;

}


/// Build the run-time alias check data for a single alias group.
///
/// The accesses are partitioned by whether their array is written anywhere
/// (according to @p HasWriteAccess). If a check is required, the min/max
/// accesses of both partitions are computed and registered with the SCoP.
///
/// @param AliasGroup     The accesses that may alias each other.
/// @param HasWriteAccess The arrays with at least one write access.
///
/// @returns True if no check is needed or the check data was built; false if
///          the group contains a non-affine access (the SCoP is invalidated),
///          the min/max computation failed, or too many arrays would have to
///          be compared.
bool ScopBuilder::buildAliasGroup(
    AliasGroupTy &AliasGroup, DenseSet<const ScopArrayInfo *> HasWriteAccess) {
  // Fewer than two accesses: nothing to compare against.
  if (AliasGroup.size() < 2)
    return true;

  AliasGroupTy ReadOnlyAccesses;
  AliasGroupTy ReadWriteAccesses;
  SmallPtrSet<const ScopArrayInfo *, 4> ReadWriteArrays;
  SmallPtrSet<const ScopArrayInfo *, 4> ReadOnlyArrays;

  for (MemoryAccess *Access : AliasGroup) {
    ORE.emit(OptimizationRemarkAnalysis(DEBUG_TYPE, "PossibleAlias",
                                        Access->getAccessInstruction())
             << "Possibly aliasing pointer, use restrict keyword.");

    const ScopArrayInfo *Array = Access->getScopArrayInfo();
    const bool ArrayIsWritten = HasWriteAccess.count(Array);
    (ArrayIsWritten ? ReadWriteArrays : ReadOnlyArrays).insert(Array);
    (ArrayIsWritten ? ReadWriteAccesses : ReadOnlyAccesses).push_back(Access);
  }

  // No alias check is needed if there is no read-write pointer at all, or if
  // there are no read-only pointers and fewer than two read-write pointers.
  if (ReadWriteArrays.empty() ||
      (ReadOnlyAccesses.empty() && ReadWriteArrays.size() <= 1))
    return true;

  // A non-affine access has no sufficiently tight lower and upper bound, so
  // no alias check can be generated for it: bail out.
  for (MemoryAccess *Access : AliasGroup) {
    if (Access->isAffine())
      continue;

    Instruction *AccInst = Access->getAccessInstruction();
    scop->invalidate(ALIASING, AccInst->getDebugLoc(), AccInst->getParent());
    return false;
  }

  // The base pointers of all accesses we generate checks for must be
  // available, so their loads are marked as required invariant loads.
  for (MemoryAccess *Access : AliasGroup)
    if (MemoryAccess *BasePtrMA = scop->lookupBasePtrAccess(Access))
      scop->addRequiredInvariantLoad(
          cast<LoadInst>(BasePtrMA->getAccessInstruction()));

  Scop::MinMaxVectorTy MinMaxAccessesReadWrite;
  if (!calculateMinMaxAccess(ReadWriteAccesses, MinMaxAccessesReadWrite))
    return false;

  // Bail out if too many values would have to be compared; the number of
  // comparisons grows quadratically with the number of values.
  if (MinMaxAccessesReadWrite.size() + ReadOnlyArrays.size() >
      RunTimeChecksMaxArraysPerGroup)
    return false;

  Scop::MinMaxVectorTy MinMaxAccessesReadOnly;
  const bool ReadOnlyValid =
      calculateMinMaxAccess(ReadOnlyAccesses, MinMaxAccessesReadOnly);

  // The group is registered regardless of whether the read-only computation
  // succeeded; the failure is still reported to the caller.
  scop->addAliasGroup(MinMaxAccessesReadWrite, MinMaxAccessesReadOnly);
  return ReadOnlyValid;
}


/// Split alias groups whose accesses have disjoint access domains.
///
/// For each group, a running domain is seeded with the access domain of the
/// first member. Each member whose access domain is disjoint from the running
/// domain is removed from the group and collected into a new group; otherwise
/// its domain is merged into the running domain. A new group with more than
/// one member is appended to @p AliasGroups and is itself visited later by
/// this loop.
///
/// @param AliasGroups The groups to split; modified in place.
void ScopBuilder::splitAliasGroupsByDomain(AliasGroupVectorTy &AliasGroups) {
  // The vector may grow while iterating, hence the index loop with a
  // re-evaluated bound.
  for (unsigned Idx = 0; Idx < AliasGroups.size(); ++Idx) {
    AliasGroupTy SplitOff;
    // This reference is only used before the push_back below, which may
    // reallocate the vector.
    AliasGroupTy &Group = AliasGroups[Idx];
    isl::set GroupDomain = getAccessDomain(Group.front());

    for (AliasGroupTy::iterator It = Group.begin(); It != Group.end();) {
      MemoryAccess *Member = *It;
      isl::set MemberDomain = getAccessDomain(Member);
      if (GroupDomain.is_disjoint(MemberDomain)) {
        SplitOff.push_back(Member);
        It = Group.erase(It);
      } else {
        GroupDomain = GroupDomain.unite(MemberDomain);
        ++It;
      }
    }

    if (SplitOff.size() > 1)
      AliasGroups.push_back(std::move(SplitOff));
  }
}


#ifndef NDEBUG

/// Assert that the use @p Op is classified as the same kind of use by both
/// VirtualUse::create variants (last argument false and true).
static void verifyUse(Scop *S, Use &Op, LoopInfo &LI) {
  VirtualUse Physical = VirtualUse::create(S, Op, &LI, false);
  VirtualUse Virtual = VirtualUse::create(S, Op, &LI, true);
  assert(Physical.getKind() == Virtual.getKind());
}


/// Check the consistency of every statement's MemoryAccesses.
///
/// The "physical" kind of a use (derived from the BasicBlock an instruction
/// resides in) is expected to equal its "virtual" kind (derived from a
/// statement's MemoryAccesses).
///
/// ensureValueRead relies on the physical uses to decide whether to create
/// MemoryAccesses, so once that is done both derivations must agree on the
/// kind of scalar access.
///
/// Later SCoP-modifying passes may change the MemoryAccesses and thereby
/// intentionally change the kind of a use, which is why the CodeGenerator has
/// to work with virtual uses. At the point this check runs no such change has
/// happened yet, so virtual and physical uses are still equivalent.
static void verifyUses(Scop *S, LoopInfo &LI, DominatorTree &DT) {
  for (BasicBlock *BB : S->getRegion().blocks()) {
    for (Instruction &Inst : *BB) {
      ScopStmt *Stmt = S->getStmtFor(&Inst);

      // Skip instructions that belong to no statement, ignored intrinsics,
      // and terminators of block statements (branch conditions are encoded in
      // the statement domains).
      if (!Stmt || isIgnoredIntrinsic(&Inst) ||
          (Inst.isTerminator() && Stmt->isBlockStmt()))
        continue;

      // Verify all uses.
      for (Use &Op : Inst.operands())
        verifyUse(S, Op, LI);

      // Stores do not produce values used by other statements.
      if (isa<StoreInst>(Inst))
        continue;

      // A use of the defined value inside its own statement must not be an
      // inter-statement use. It may still be synthesizable or load-hoisted,
      // but such instructions are not directly copied during code generation.
      VirtualUse VirtDef =
          VirtualUse::create(S, Stmt, Stmt->getSurroundingLoop(), &Inst, true);
      auto DefKind = VirtDef.getKind();
      assert(DefKind == VirtualUse::Synthesizable ||
             DefKind == VirtualUse::Intra || DefKind == VirtualUse::Hoisted);
    }
  }

  // Exit-block PHIs only need checking when the region does not have a single
  // exit edge and is not the top-level region.
  if (S->hasSingleExitEdge() || S->getRegion().isTopLevelRegion())
    return;

  // PHINodes in the SCoP region's exit block are also uses to be checked.
  for (Instruction &Inst : *S->getRegion().getExit()) {
    if (!isa<PHINode>(Inst))
      break;

    for (Use &Op : Inst.operands())
      verifyUse(S, Op, LI);
  }
}

#endif


/// Build the polyhedral description of region @p R and store it in `scop`.
///
/// The construction is a fixed pipeline: statements, memory accesses, domains,
/// assumptions, access relations, schedule, contexts, alias checks and
/// invariant load hoisting, in that order. Several steps can bail out early;
/// the function then simply returns and leaves the partially built SCoP in
/// `scop`.
///
/// @param R  The region to model.
/// @param AC The assumption cache passed on to addUserAssumptions.
void ScopBuilder::buildScop(Region &R, AssumptionCache &AC) {
  scop.reset(new Scop(R, SE, LI, DT, *SD.getDetectionContext(&R), ORE,
                      SD.getNextID()));

  buildStmts(R);

  // Create all invariant load instructions first. They are categorized as
  // 'synthesizable' and therefore belong to no ScopStmt, yet they have to be
  // created somewhere.
  const InvariantLoadsSetTy &RequiredLoads = scop->getRequiredInvariantLoads();
  for (BasicBlock *BB : scop->getRegion().blocks()) {
    if (SD.isErrorBlock(*BB, scop->getRegion()))
      continue;

    for (Instruction &Inst : *BB) {
      auto *Load = dyn_cast<LoadInst>(&Inst);
      if (!Load || !RequiredLoads.count(Load))
        continue;

      // An invariant load needs a MemoryAccess in some statement. Which one
      // does not matter because the access is removed from the ScopStmt again
      // later; the first statement of the load's basic block is used.
      ArrayRef<ScopStmt *> StmtsOfBB = scop->getStmtListFor(BB);
      assert(!StmtsOfBB.empty());
      buildMemoryAccess(Load, StmtsOfBB.front());
    }
  }
  buildAccessFunctions();

  // If the region has no exiting block, the exit block is split later (during
  // code generation), which moves potential PHI nodes from the current exit
  // block into the new region exiting block. PHI nodes that are outside the
  // region now will then be inside it, so their operands are modeled as scalar
  // accesses here. Nothing in the exit block is modeled if the region has an
  // exiting block, as no splitting happens in that case.
  if (!R.isTopLevelRegion() && !scop->hasSingleExitEdge()) {
    for (Instruction &Inst : *R.getExit()) {
      auto *PHI = dyn_cast<PHINode>(&Inst);
      if (!PHI)
        break;

      buildPHIAccesses(nullptr, PHI, nullptr, true);
    }
  }

  // Create memory accesses for global reads since all arrays are now known.
  const SCEV *AF = SE.getConstant(IntegerType::getInt64Ty(SE.getContext()), 0);
  for (auto [GlobalReadStmt, GlobalRead] : GlobalReads) {
    for (auto *BP : ArrayBasePointers)
      addArrayAccess(GlobalReadStmt, MemAccInst(GlobalRead), MemoryAccess::READ,
                     BP, BP->getType(), false, {AF}, {nullptr}, GlobalRead);
  }

  buildInvariantEquivalenceClasses();

  // Maps basic blocks to their invalid domains.
  DenseMap<BasicBlock *, isl::set> InvalidDomainMap;

  if (!buildDomains(&R, InvalidDomainMap)) {
    POLLY_DEBUG(
        dbgs() << "Bailing-out because buildDomains encountered problems\n");
    return;
  }

  addUserAssumptions(AC, InvalidDomainMap);

  // Initialize the invalid domain of each statement from the block that
  // represents it: the entry block for block statements, otherwise the basic
  // block of the statement's region node.
  for (ScopStmt &Stmt : scop->Stmts) {
    BasicBlock *KeyBB =
        Stmt.isBlockStmt()
            ? Stmt.getEntryBlock()
            : getRegionNodeBasicBlock(Stmt.getRegion()->getNode());
    Stmt.setInvalidDomain(InvalidDomainMap[KeyBB]);
  }

  // Remove empty statements and exit early if no executable statement is left
  // in this SCoP.
  scop->removeStmtNotInDomainMap();
  scop->simplifySCoP(false);
  if (scop->isEmpty()) {
    POLLY_DEBUG(dbgs() << "Bailing-out because SCoP is empty\n");
    return;
  }

  // The ScopStmts now have enough information to initialize themselves.
  for (ScopStmt &Stmt : *scop) {
    collectSurroundingLoops(Stmt);

    buildDomain(Stmt);
    buildAccessRelations(Stmt);

    if (DetectReductions)
      checkForReductions(Stmt);
  }

  // Check early for a feasible runtime context.
  if (!scop->hasFeasibleRuntimeContext()) {
    POLLY_DEBUG(
        dbgs() << "Bailing-out because of unfeasible context (early)\n");
    return;
  }

  // Check early for profitability. It cannot change afterwards; only the
  // runtime context can still become infeasible.
  if (!scop->isProfitable(UnprofitableScalarAccs)) {
    scop->invalidate(PROFITABLE, DebugLoc());
    POLLY_DEBUG(
        dbgs() << "Bailing-out because SCoP is not considered profitable\n");
    return;
  }

  buildSchedule();

  finalizeAccesses();

  scop->realignParams();
  addUserContext();

  // With the context fully constructed, all knowledge about the parameters is
  // available, so the recorded assumptions are now added to the
  // assumed/invalid context.
  addRecordedAssumptions();

  scop->simplifyContexts();
  if (!buildAliasChecks()) {
    POLLY_DEBUG(dbgs() << "Bailing-out because could not build alias checks\n");
    return;
  }

  hoistInvariantLoads();
  canonicalizeDynamicBasePtrs();
  verifyInvariantLoads();
  scop->simplifySCoP(true);

  // Check late for a feasible runtime context; profitability did not change.
  if (!scop->hasFeasibleRuntimeContext()) {
    POLLY_DEBUG(dbgs() << "Bailing-out because of unfeasible context (late)\n");
    return;
  }

#ifndef NDEBUG
  verifyUses(scop.get(), LI, DT);
#endif
}


/// Construct the builder and immediately build the SCoP for region @p R.
///
/// Optimization remarks mark the beginning and the end of the SCoP. If the
/// built SCoP has no feasible runtime context it is dismissed: the recorded
/// assumptions are cleared and `scop` is reset. Otherwise the SCoP statistics
/// are updated.
ScopBuilder::ScopBuilder(Region *R, AssumptionCache &AC, AAResults &AA,
                         const DataLayout &DL, DominatorTree &DT, LoopInfo &LI,
                         ScopDetection &SD, ScalarEvolution &SE,
                         OptimizationRemarkEmitter &ORE)
    : AA(AA), DL(DL), DT(DT), LI(LI), SD(SD), SE(SE), ORE(ORE) {
  auto P = getBBPairForRegion(R);
  DebugLoc Beg, End;
  getDebugLocations(P, Beg, End);

  const std::string BeginMsg = "SCoP begins here.";
  ORE.emit(OptimizationRemarkAnalysis(DEBUG_TYPE, "ScopEntry", Beg, P.first)
           << BeginMsg);

  buildScop(*R, AC);

  POLLY_DEBUG(dbgs() << *scop);

  std::string EndMsg;
  if (scop->hasFeasibleRuntimeContext()) {
    EndMsg = "SCoP ends here.";
    ++ScopFound;
    if (scop->getMaxLoopDepth() > 0)
      ++RichScopFound;
  } else {
    InfeasibleScops++;
    EndMsg = "SCoP ends here but was dismissed.";
    POLLY_DEBUG(dbgs() << "SCoP detected but dismissed\n");
    RecordedAssumptions.clear();
    scop.reset();
  }

  // The end remark is attached to the first block of the pair for the
  // top-level region and to the second block otherwise.
  auto *EndBlock = R->isTopLevelRegion() ? P.first : P.second;
  ORE.emit(OptimizationRemarkAnalysis(DEBUG_TYPE, "ScopEnd", End, EndBlock)
           << EndMsg);
}

OptComputeOut
static cl::opt< int > OptComputeOut("polly-dependences-computeout", cl::desc("Bound the dependence analysis by a maximal amount of " "computational steps (0 means no bound)"), cl::Hidden, cl::init(500000), cl::cat(PollyCategory))

DEBUG_TYPE
#define DEBUG_TYPE
Definition: DependenceInfo.cpp:43

GICHelper.h

ISLTools.h

unsignedFromIslSize
unsigned unsignedFromIslSize(const isl::size &Size)
Check that Size is valid (only on debug builds) and cast it to unsigned.
Definition: ISLTools.h:40

Options.h

PollyCategory
llvm::cl::OptionCategory PollyCategory

PollyDebug.h

POLLY_DEBUG
#define POLLY_DEBUG(X)
Definition: PollyDebug.h:23

SCEVValidator.h

OptComputeOut
static cl::opt< int > OptComputeOut("polly-analysis-computeout", cl::desc("Bound the scop analysis by a maximal amount of " "computational steps (0 means no bound)"), cl::Hidden, cl::init(800000), cl::cat(PollyCategory))

DisableMultiplicativeReductions
static cl::opt< bool > DisableMultiplicativeReductions("polly-disable-multiplicative-reductions", cl::desc("Disable multiplicative reductions"), cl::Hidden, cl::cat(PollyCategory))

replaceBasePtrArrays
static void replaceBasePtrArrays(Scop &S, const ScopArrayInfo *Old, const ScopArrayInfo *New)
Replace the base pointer arrays in all memory accesses referencing Old, with a reference to New.
Definition: ScopBuilder.cpp:3163

partitionSetParts
static std::pair< isl::set, isl::set > partitionSetParts(isl::set S, unsigned Dim)
Compute the (un)bounded parts of S wrt.
Definition: ScopBuilder.cpp:227

createNextIterationMap
static isl::map createNextIterationMap(isl::space SetSpace, unsigned Dim)
}
Definition: ScopBuilder.cpp:198

buildConditionSet
static isl::set buildConditionSet(ICmpInst::Predicate Pred, isl::pw_aff L, isl::pw_aff R)
Create the conditions under which L Pred R is true.
Definition: ScopBuilder.cpp:266

findCanonicalArray
static const ScopArrayInfo * findCanonicalArray(Scop &S, MemoryAccessList &Accesses)
Find the canonical scop array info object for a set of invariant load hoisted loads.
Definition: ScopBuilder.cpp:3141

collectBoundedParts
static isl::set collectBoundedParts(isl::set S)
Add BSet to set BoundedParts if BSet is bounded.
Definition: ScopBuilder.cpp:215

joinOrderedPHIs
static void joinOrderedPHIs(EquivalenceClasses< Instruction * > &UnionFind, ArrayRef< Instruction * > ModeledInsts)
If the BasicBlock has an edge from itself, ensure that the PHI WRITEs for the incoming values from th...
Definition: ScopBuilder.cpp:1925

UserContextStr
static cl::opt< std::string > UserContextStr("polly-context", cl::value_desc("isl parameter set"), cl::desc("Provide additional constraints on the context parameters"), cl::init(""), cl::cat(PollyCategory))

isDivisible
static bool isDivisible(const SCEV *Expr, unsigned Size, ScalarEvolution &SE)
Check if Expr is divisible by Size.
Definition: ScopBuilder.cpp:2165

getRegionNodeSuccessor
static BasicBlock * getRegionNodeSuccessor(RegionNode *RN, Instruction *TI, unsigned idx)
Return the idx'th block that is executed after RN.
Definition: ScopBuilder.cpp:171

PollyAllowDereferenceOfAllFunctionParams
static cl::opt< bool > PollyAllowDereferenceOfAllFunctionParams("polly-allow-dereference-of-all-function-parameters", cl::desc("Treat all parameters to functions that are pointers as dereferencible." " This is useful for invariant load hoisting, since we can generate" " less runtime checks. This is only valid if all pointers to functions" " are always initialized, so that Polly can choose to hoist" " their loads. "), cl::Hidden, cl::init(false), cl::cat(PollyCategory))

getAccessDomain
static isl::set getAccessDomain(MemoryAccess *MA)
Definition: ScopBuilder.cpp:3344

RunTimeChecksMaxArraysPerGroup
static cl::opt< unsigned > RunTimeChecksMaxArraysPerGroup("polly-rtc-max-arrays-per-group", cl::desc("The maximal number of arrays to compare in each alias group."), cl::Hidden, cl::init(20), cl::cat(PollyCategory))

isAccessRangeTooComplex
static bool isAccessRangeTooComplex(isl::set AccessRange)
Check if an access range is too complex.
Definition: ScopBuilder.cpp:2834

getReductionType
static MemoryAccess::ReductionType getReductionType(const BinaryOperator *BinOp)
Return the reduction type for a given binary operator.
Definition: ScopBuilder.cpp:2485

isUsedForIndirectHoistedLoad
static bool isUsedForIndirectHoistedLoad(Scop &S, const ScopArrayInfo *Array)
Check if Array serves as base array in an invariant load.
Definition: ScopBuilder.cpp:3153

XModelReadOnlyScalars
static cl::opt< bool, true > XModelReadOnlyScalars("polly-analyze-read-only-scalars", cl::desc("Model read-only scalar values in the scop description"), cl::location(ModelReadOnlyScalars), cl::Hidden, cl::init(true), cl::cat(PollyCategory))

isAParameter
static bool isAParameter(llvm::Value *maybeParam, const Function &F)
Definition: ScopBuilder.cpp:2973

combineInSequence
static isl::schedule combineInSequence(isl::schedule Prev, isl::schedule Succ)
Definition: ScopBuilder.cpp:1135

joinOrderedInstructions
static void joinOrderedInstructions(EquivalenceClasses< Instruction * > &UnionFind, ArrayRef< Instruction * > ModeledInsts)
Ensure that the order of ordered instructions does not change.
Definition: ScopBuilder.cpp:1874

RunTimeChecksMaxAccessDisjuncts
static cl::opt< unsigned > RunTimeChecksMaxAccessDisjuncts("polly-rtc-max-array-disjuncts", cl::desc("The maximal number of disjunts allowed in memory accesses to " "to build RTCs."), cl::Hidden, cl::init(8), cl::cat(PollyCategory))

GranularityChoice
GranularityChoice
Definition: ScopBuilder.cpp:145

GranularityChoice::ScalarIndependence
@ ScalarIndependence

GranularityChoice::BasicBlocks
@ BasicBlocks

GranularityChoice::Stores
@ Stores

joinOperandTree
static void joinOperandTree(EquivalenceClasses< Instruction * > &UnionFind, ArrayRef< Instruction * > ModeledInsts)
Join instructions to the same statement if one uses the scalar result of the other.
Definition: ScopBuilder.cpp:1847

hasIntersectingAccesses
bool hasIntersectingAccesses(isl::set AllAccs, MemoryAccess *LoadMA, MemoryAccess *StoreMA, isl::set Domain, SmallVector< MemoryAccess *, 8 > &MemAccs)
True if AllAccs intersects with MemAccs except LoadMA and StoreMA.
Definition: ScopBuilder.cpp:2527

DetectReductions
static cl::opt< bool > DetectReductions("polly-detect-reductions", cl::desc("Detect and exploit reductions"), cl::Hidden, cl::init(true), cl::cat(PollyCategory))

makeStmtName
static std::string makeStmtName(BasicBlock *BB, long BBIdx, int Count, bool IsMain, bool IsLast=false)
Generate a name for a statement.
Definition: ScopBuilder.cpp:1789

getRegionNodeBasicBlock
static BasicBlock * getRegionNodeBasicBlock(RegionNode *RN)
Helper to treat non-affine regions and basic blocks the same.
Definition: ScopBuilder.cpp:164

StmtGranularity
static cl::opt< GranularityChoice > StmtGranularity("polly-stmt-granularity", cl::desc("Algorithm to use for splitting basic blocks into multiple statements"), cl::values(clEnumValN(GranularityChoice::BasicBlocks, "bb", "One statement per basic block"), clEnumValN(GranularityChoice::ScalarIndependence, "scalar-indep", "Scalar independence heuristic"), clEnumValN(GranularityChoice::Stores, "store", "Store-level granularity")), cl::init(GranularityChoice::ScalarIndependence), cl::cat(PollyCategory))

containsErrorBlock
static bool containsErrorBlock(RegionNode *RN, const Region &R, ScopDetection *SD)
Definition: ScopBuilder.cpp:179

verifyUse
static void verifyUse(Scop *S, Use &Op, LoopInfo &LI)
Definition: ScopBuilder.cpp:3552

STATISTIC
STATISTIC(ScopFound, "Number of valid Scops")

MaxDimensionsInAccessRange
static unsigned const MaxDimensionsInAccessRange
Definition: ScopBuilder.cpp:77

buildMinMaxAccess
static bool buildMinMaxAccess(isl::set Set, Scop::MinMaxVectorTy &MinMaxAccesses, Scop &S)
Add the minimal/maximal access in Set to User.
Definition: ScopBuilder.cpp:3250

mapToDimension
static isl::multi_union_pw_aff mapToDimension(isl::union_set USet, unsigned N)
Definition: ScopBuilder.cpp:1158

verifyUses
static void verifyUses(Scop *S, LoopInfo &LI, DominatorTree &DT)
Check the consistency of every statement's MemoryAccesses.
Definition: ScopBuilder.cpp:3573

combineReductionType
static MemoryAccess::ReductionType combineReductionType(MemoryAccess::ReductionType RT0, MemoryAccess::ReductionType RT1)
Combine two reduction types.
Definition: ScopBuilder.cpp:2516

isOrderedInstruction
static bool isOrderedInstruction(Instruction *Inst)
Is Inst an ordered instruction?
Definition: ScopBuilder.cpp:1841

RunTimeChecksMaxParameters
static cl::opt< unsigned > RunTimeChecksMaxParameters("polly-rtc-max-parameters", cl::desc("The maximal number of parameters allowed in RTCs."), cl::Hidden, cl::init(8), cl::cat(PollyCategory))

UnprofitableScalarAccs
static cl::opt< bool > UnprofitableScalarAccs("polly-unprofitable-scalar-accs", cl::desc("Count statements with scalar accesses as not optimizable"), cl::Hidden, cl::init(false), cl::cat(PollyCategory))

checkCandidatePairAccesses
bool checkCandidatePairAccesses(MemoryAccess *LoadMA, MemoryAccess *StoreMA, isl::set Domain, SmallVector< MemoryAccess *, 8 > &MemAccs)
Test if the accesses of LoadMA and StoreMA can form a reduction.
Definition: ScopBuilder.cpp:2552

PollyIgnoreInbounds
static cl::opt< bool > PollyIgnoreInbounds("polly-ignore-inbounds", cl::desc("Do not take inbounds assumptions at all"), cl::Hidden, cl::init(false), cl::cat(PollyCategory))

ScopBuilder.h

ScopDetection.h

N
static RegisterPass< ScopOnlyPrinterWrapperPass > N("dot-scops-only", "Polly - Print Scops of function (with no function bodies)")

ScopHelper.h

ScopInfo.h

VirtualInstruction.h

isl_pw_aff_free
__isl_null isl_pw_aff * isl_pw_aff_free(__isl_take isl_pw_aff *pwaff)

isl_pw_aff_zero_on_domain
__isl_give isl_pw_aff * isl_pw_aff_zero_on_domain(__isl_take isl_local_space *ls)
Definition: isl_aff.c:206

isl_pw_aff_get_domain_space
__isl_give isl_space * isl_pw_aff_get_domain_space(__isl_keep isl_pw_aff *pwaff)

isl_pw_aff_lt_set
__isl_export __isl_give isl_set * isl_pw_aff_lt_set(__isl_take isl_pw_aff *pwaff1, __isl_take isl_pw_aff *pwaff2)
Definition: isl_aff.c:3069

isl_pw_aff_le_set
__isl_export __isl_give isl_set * isl_pw_aff_le_set(__isl_take isl_pw_aff *pwaff1, __isl_take isl_pw_aff *pwaff2)
Definition: isl_aff.c:3063

isl_pw_aff_copy
__isl_give isl_pw_aff * isl_pw_aff_copy(__isl_keep isl_pw_aff *pwaff)

isl::aff
Definition: isl-noexceptions.h:314

isl::aff::get_denominator_val
isl::val get_denominator_val() const
Definition: isl-noexceptions.h:5102

isl::aff::add_constant_si
isl::aff add_constant_si(int v) const
Definition: isl-noexceptions.h:4977

isl::basic_set
Definition: isl-noexceptions.h:1669

isl::basic_set::get_div
isl::aff get_div(int pos) const
Definition: isl-noexceptions.h:9217

isl::basic_set::is_equal
boolean is_equal(const isl::basic_set &bset2) const
Definition: isl-noexceptions.h:9415

isl::basic_set::dim
class size dim(isl::dim type) const
Definition: isl-noexceptions.h:9169

isl::basic_set::fix_si
isl::basic_set fix_si(isl::dim type, unsigned int pos, int value) const
Definition: isl-noexceptions.h:9252

isl::constraint
Definition: isl-noexceptions.h:1881

isl::constraint::alloc_inequality
static isl::constraint alloc_inequality(isl::local_space ls)
Definition: isl-noexceptions.h:10043

isl::constraint::alloc_equality
static isl::constraint alloc_equality(isl::local_space ls)
Definition: isl-noexceptions.h:10037

isl::id
Definition: isl-noexceptions.h:1948

isl::id::is_null
bool is_null() const
Definition: isl-noexceptions.h:10227

isl::id::alloc
static isl::id alloc(isl::ctx ctx, const std::string &name, void *user)
Definition: isl-noexceptions.h:10235

isl::local_space
Definition: isl-noexceptions.h:2053

isl::map
Definition: isl-noexceptions.h:2081

isl::map::add_constraint
isl::map add_constraint(isl::constraint constraint) const
Definition: isl-noexceptions.h:10630

isl::map::equate
isl::map equate(isl::dim type1, int pos1, isl::dim type2, int pos2) const
Definition: isl-noexceptions.h:10888

isl::map::universe
static isl::map universe(isl::space space)
Definition: isl-noexceptions.h:11775

isl::map::domain_tuple_dim
class size domain_tuple_dim() const
Definition: isl-noexceptions.h:10834

isl::map::set_tuple_id
isl::map set_tuple_id(isl::dim type, isl::id id) const
Definition: isl-noexceptions.h:11676

isl::map::range
isl::set range() const
Definition: isl-noexceptions.h:11557

isl::map::unite
isl::map unite(isl::map map2) const
Definition: isl-noexceptions.h:11759

isl::map::get_space
isl::space get_space() const
Definition: isl-noexceptions.h:11693

isl::map::domain
isl::set domain() const
Definition: isl-noexceptions.h:10789

isl::map::is_empty
boolean is_empty() const
Definition: isl-noexceptions.h:11288

isl::map::has_equal_space
boolean has_equal_space(const isl::map &map2) const
Definition: isl-noexceptions.h:11092

isl::map::intersect_domain
isl::map intersect_domain(isl::set set) const
Definition: isl-noexceptions.h:11138

isl::map::lex_le
static isl::map lex_le(isl::space set_space)
Definition: isl-noexceptions.h:11383

isl::map::copy
__isl_give isl_map * copy() const &
Definition: isl-noexceptions.h:10608

isl::map::involves_dims
boolean involves_dims(isl::dim type, unsigned int first, unsigned int n) const
Definition: isl-noexceptions.h:11260

isl::multi_union_pw_aff
Definition: isl-noexceptions.h:2704

isl::pw_aff
Definition: isl-noexceptions.h:3011

isl::pw_aff::lt_set
isl::set lt_set(isl::pw_aff pwaff2) const
Definition: isl-noexceptions.h:15505

isl::pw_aff::le_set
isl::set le_set(isl::pw_aff pwaff2) const
Definition: isl-noexceptions.h:15494

isl::pw_aff::get_domain_space
isl::space get_domain_space() const
Definition: isl-noexceptions.h:15273

isl::pw_aff::eq_set
isl::set eq_set(isl::pw_aff pwaff2) const
Definition: isl-noexceptions.h:15283

isl::pw_aff::ne_set
isl::set ne_set(isl::pw_aff pwaff2) const
Definition: isl-noexceptions.h:15575

isl::pw_aff::ge_set
isl::set ge_set(isl::pw_aff pwaff2) const
Definition: isl-noexceptions.h:15350

isl::pw_aff::add
isl::multi_pw_aff add(const isl::multi_pw_aff &multi2) const
Definition: isl-noexceptions.h:15083

isl::pw_aff::gt_set
isl::set gt_set(isl::pw_aff pwaff2) const
Definition: isl-noexceptions.h:15377

isl::pw_multi_aff
Definition: isl-noexceptions.h:3242

isl::pw_multi_aff::at
isl::pw_aff at(int pos) const
Definition: isl-noexceptions.h:16267

isl::pw_multi_aff::dim
class size dim(isl::dim type) const
Definition: isl-noexceptions.h:16301

isl::pw_multi_aff::set_pw_aff
isl::multi_pw_aff set_pw_aff(int pos, const isl::pw_aff &el) const
Definition: isl-noexceptions.h:16750

isl::pw_multi_aff::coalesce
isl::pw_multi_aff coalesce() const
Definition: isl-noexceptions.h:16295

isl::pw_multi_aff::project_out_map
static isl::pw_multi_aff project_out_map(isl::space space, isl::dim type, unsigned int first, unsigned int n)
Definition: isl-noexceptions.h:16605

isl::pw_multi_aff::is_null
bool is_null() const
Definition: isl-noexceptions.h:16168

isl::schedule_node::insert_mark
isl::schedule_node insert_mark(isl::id mark) const
Definition: isl-noexceptions.h:17645

isl::schedule_node::child
isl::schedule_node child(int pos) const
Definition: isl-noexceptions.h:17503

isl::schedule_node::get_schedule
isl::schedule get_schedule() const
Definition: isl-noexceptions.h:17792

isl::schedule
Definition: isl-noexceptions.h:3448

isl::schedule::is_null
bool is_null() const
Definition: isl-noexceptions.h:17128

isl::schedule::insert_partial_schedule
isl::schedule insert_partial_schedule(isl::multi_union_pw_aff partial) const
Definition: isl-noexceptions.h:17165

isl::schedule::get_root
isl::schedule_node get_root() const
Definition: isl-noexceptions.h:17200

isl::schedule::from_domain
static isl::schedule from_domain(isl::union_set domain)
Definition: isl-noexceptions.h:17153

isl::schedule::get_domain
isl::union_set get_domain() const
Definition: isl-noexceptions.h:17148

isl::schedule::sequence
isl::schedule sequence(isl::schedule schedule2) const
Definition: isl-noexceptions.h:17205

isl::set
Definition: isl-noexceptions.h:3878

isl::set::project_out
isl::set project_out(isl::dim type, unsigned int first, unsigned int n) const
Definition: isl-noexceptions.h:19121

isl::set::intersect
isl::set intersect(isl::set set2) const
Definition: isl-noexceptions.h:18822

isl::set::subtract
isl::set subtract(isl::set set2) const
Definition: isl-noexceptions.h:19258

isl::set::involves_dims
boolean involves_dims(isl::dim type, unsigned int first, unsigned int n) const
Definition: isl-noexceptions.h:18849

isl::set::set_dim_id
isl::set set_dim_id(isl::dim type, unsigned int pos, isl::id id) const
Definition: isl-noexceptions.h:19192

isl::set::insert_dims
isl::set insert_dims(isl::dim type, unsigned int pos, unsigned int n) const
Definition: isl-noexceptions.h:18810

isl::set::find_dim_by_id
int find_dim_by_id(isl::dim type, const isl::id &id) const
Definition: isl-noexceptions.h:18704

isl::set::universe
static isl::set universe(isl::space space)
Definition: isl-noexceptions.h:19359

isl::set::n_basic_set
class size n_basic_set() const
Definition: isl-noexceptions.h:19057

isl::set::has_equal_space
boolean has_equal_space(const isl::set &set2) const
Definition: isl-noexceptions.h:18787

isl::set::copy
__isl_give isl_set * copy() const &
Definition: isl-noexceptions.h:18493

isl::set::complement
isl::set complement() const
Definition: isl-noexceptions.h:18589

isl::set::gist_params
isl::set gist_params(isl::set context) const
Definition: isl-noexceptions.h:18781

isl::set::lexmax_pw_multi_aff
isl::pw_multi_aff lexmax_pw_multi_aff() const
Definition: isl-noexceptions.h:18986

isl::set::is_subset
boolean is_subset(const isl::set &set2) const
Definition: isl-noexceptions.h:18948

isl::set::remove_dims
isl::set remove_dims(isl::dim type, unsigned int first, unsigned int n) const
Definition: isl-noexceptions.h:19156

isl::set::lexmin_pw_multi_aff
isl::pw_multi_aff lexmin_pw_multi_aff() const
Definition: isl-noexceptions.h:18998

isl::set::detect_equalities
isl::set detect_equalities() const
Definition: isl-noexceptions.h:18611

isl::set::get_dim_name
std::string get_dim_name(isl::dim type, unsigned int pos) const
Definition: isl-noexceptions.h:18671

isl::set::set_tuple_id
isl::set set_tuple_id(isl::id id) const
Definition: isl-noexceptions.h:19208

isl::set::coalesce
isl::set coalesce() const
Definition: isl-noexceptions.h:18583

isl::set::is_null
bool is_null() const
Definition: isl-noexceptions.h:18507

isl::set::empty
static isl::set empty(isl::space space)
Definition: isl-noexceptions.h:18688

isl::set::tuple_dim
class size tuple_dim() const
Definition: isl-noexceptions.h:19297

isl::set::add_constraint
isl::set add_constraint(isl::constraint constraint) const
Definition: isl-noexceptions.h:18515

isl::set::get_space
isl::space get_space() const
Definition: isl-noexceptions.h:19242

isl::set::apply
isl::set apply(isl::map map) const
Definition: isl-noexceptions.h:18539

isl::set::is_empty
boolean is_empty() const
Definition: isl-noexceptions.h:18888

isl::set::release
__isl_give isl_set * release()
Definition: isl-noexceptions.h:18501

isl::set::lower_bound_si
isl::set lower_bound_si(isl::dim type, unsigned int pos, int value) const
Definition: isl-noexceptions.h:19016

isl::set::get
__isl_keep isl_set * get() const
Definition: isl-noexceptions.h:18497

isl::set::dim
class size dim(isl::dim type) const
Definition: isl-noexceptions.h:18617

isl::set::add_dims
isl::set add_dims(isl::dim type, unsigned int n) const
Definition: isl-noexceptions.h:18521

isl::set::eliminate
isl::set eliminate(isl::dim type, unsigned int first, unsigned int n) const
Definition: isl-noexceptions.h:18682

isl::set::is_disjoint
boolean is_disjoint(const isl::set &set2) const
Definition: isl-noexceptions.h:18867

isl::set::unite
isl::set unite(isl::set set2) const
Definition: isl-noexceptions.h:19338

isl::set::get_basic_set_list
isl::basic_set_list get_basic_set_list() const
Definition: isl-noexceptions.h:18572

isl::set::is_equal
boolean is_equal(const isl::set &set2) const
Definition: isl-noexceptions.h:18894

isl::set::simple_hull
isl::basic_set simple_hull() const
Definition: isl-noexceptions.h:19230

isl::set::remove_divs
isl::set remove_divs() const
Definition: isl-noexceptions.h:19162

isl::set::affine_hull
isl::basic_set affine_hull() const
Definition: isl-noexceptions.h:18527

isl::set::params
isl::set params() const
Definition: isl-noexceptions.h:19063

isl::set::project_out_all_params
isl::set project_out_all_params() const
Definition: isl-noexceptions.h:19127

isl::size
Definition: isl-noexceptions.h:154

isl::space
Definition: isl-noexceptions.h:4101

isl::space::dim
class size dim(isl::dim type) const
Definition: isl-noexceptions.h:19667

isl::space::get_dim_id
isl::id get_dim_id(isl::dim type, unsigned int pos) const
Definition: isl-noexceptions.h:19679

isl::space::map_from_set
isl::space map_from_set() const
Definition: isl-noexceptions.h:19820

isl::space::range
isl::space range() const
Definition: isl-noexceptions.h:19891

isl::space::align_params
isl::space align_params(isl::space space2) const
Definition: isl-noexceptions.h:19655

isl::union_map
Definition: isl-noexceptions.h:4280

isl::union_map::range
isl::union_set range() const
Definition: isl-noexceptions.h:20832

isl::union_map::unite
isl::union_map unite(isl::union_map umap2) const
Definition: isl-noexceptions.h:20909

isl::union_map::intersect_range
isl::union_map intersect_range(isl::space space) const
Definition: isl-noexceptions.h:20665

isl::union_map::empty
static isl::union_map empty(isl::ctx ctx)
Definition: isl-noexceptions.h:20500

isl::union_map::params
isl::set params() const
Definition: isl-noexceptions.h:20766

isl::union_map::intersect_domain
isl::union_map intersect_domain(isl::space space) const
Definition: isl-noexceptions.h:20635

isl::union_pw_multi_aff
Definition: isl-noexceptions.h:4540

isl::union_pw_multi_aff::empty
static isl::union_pw_multi_aff empty(isl::space space)
Definition: isl-noexceptions.h:21702

isl::union_set
Definition: isl-noexceptions.h:4607

isl::union_set::contains
boolean contains(const isl::space &space) const
Definition: isl-noexceptions.h:21975

isl::union_set::is_null
bool is_null() const
Definition: isl-noexceptions.h:21937

isl::union_set::get_set_list
isl::set_list get_set_list() const
Definition: isl-noexceptions.h:22167

isl::union_set::extract_set
isl::set extract_set(isl::space space) const
Definition: isl-noexceptions.h:22007

isl::union_set::get_space
isl::space get_space() const
Definition: isl-noexceptions.h:22178

isl::union_set::is_empty
boolean is_empty() const
Definition: isl-noexceptions.h:22083

isl::val
Definition: isl-noexceptions.h:4718

isl::val::is_int
boolean is_int() const
Definition: isl-noexceptions.h:22581

polly::IslMaxOperationsGuard
Scoped limit of ISL operations.
Definition: GICHelper.h:424

polly::MemAccInst
Utility proxy to wrap the common members of LoadInst and StoreInst.
Definition: ScopHelper.h:140

polly::MemAccInst::getValueOperand
llvm::Value * getValueOperand() const
Definition: ScopHelper.h:237

polly::MemAccInst::isLoad
bool isLoad() const
Definition: ScopHelper.h:310

polly::MemAccInst::dyn_cast
static MemAccInst dyn_cast(llvm::Value &V)
Definition: ScopHelper.h:178

polly::MemAccInst::isStore
bool isStore() const
Definition: ScopHelper.h:311

polly::MemAccInst::getPointerOperand
llvm::Value * getPointerOperand() const
Definition: ScopHelper.h:248

polly::MemoryAccess
Represent memory accesses in statements.
Definition: ScopInfo.h:431

polly::MemoryAccess::addIncoming
void addIncoming(BasicBlock *IncomingBlock, Value *IncomingValue)
Add a new incoming block/value pair for this PHI/ExitPHI access.
Definition: ScopInfo.h:736

polly::MemoryAccess::dump
void dump() const
Print the MemoryAccess to stderr.
Definition: ScopInfo.cpp:955

polly::MemoryAccess::Sizes
SmallVector< const SCEV *, 4 > Sizes
Size of each dimension of the accessed array.
Definition: ScopInfo.h:548

polly::MemoryAccess::AccessType
AccessType
The access type of a memory access.
Definition: ScopInfo.h:457

polly::MemoryAccess::MAY_WRITE
@ MAY_WRITE
Definition: ScopInfo.h:460

polly::MemoryAccess::READ
@ READ
Definition: ScopInfo.h:458

polly::MemoryAccess::MUST_WRITE
@ MUST_WRITE
Definition: ScopInfo.h:459

polly::MemoryAccess::ReductionType
ReductionType
Reduction access type.
Definition: ScopInfo.h:466

polly::MemoryAccess::RT_BOTTOM
@ RT_BOTTOM
Pseudo type for the data flow analysis.
Definition: ScopInfo.h:474

polly::MemoryAccess::RT_BOR
@ RT_BOR
Bitwise Or.
Definition: ScopInfo.h:470

polly::MemoryAccess::RT_BAND
@ RT_BAND
Bitwise And.
Definition: ScopInfo.h:472

polly::MemoryAccess::RT_ADD
@ RT_ADD
Addition.
Definition: ScopInfo.h:468

polly::MemoryAccess::RT_BXOR
@ RT_BXOR
Bitwise XOr.
Definition: ScopInfo.h:471

polly::MemoryAccess::RT_NONE
@ RT_NONE
Indicate no reduction at all.
Definition: ScopInfo.h:467

polly::MemoryAccess::RT_MUL
@ RT_MUL
Multiplication.
Definition: ScopInfo.h:469

polly::MemoryAccess::isValueKind
bool isValueKind() const
Old name of isOriginalValueKind().
Definition: ScopInfo.h:986

polly::MemoryAccess::isPHIKind
bool isPHIKind() const
Old name of isOriginalPHIKind.
Definition: ScopInfo.h:998

polly::MemoryAccess::isWrite
bool isWrite() const
Is this a write memory access?
Definition: ScopInfo.h:769

polly::MemoryAccess::getAccessInstruction
Instruction * getAccessInstruction() const
Return the access instruction of this memory access.
Definition: ScopInfo.h:885

polly::MemoryAccess::subscripts
iterator_range< SubscriptsTy::const_iterator > subscripts() const
Return an iterator range containing the subscripts.
Definition: ScopInfo.h:888

polly::MemoryAccess::isExitPHIKind
bool isExitPHIKind() const
Old name of isOriginalExitPHIKind().
Definition: ScopInfo.h:1014

polly::MemoryAccess::isRead
bool isRead() const
Is this a read memory access?
Definition: ScopInfo.h:760

polly::MemoryAccess::buildAccessRelation
void buildAccessRelation(const ScopArrayInfo *SAI)
Assemble the access relation from all available information.
Definition: ScopInfo.cpp:817

polly::MemoryAccess::isScalarKind
bool isScalarKind() const
Old name of isOriginalScalarKind.
Definition: ScopInfo.h:973

polly::MemoryAccess::getElementType
Type * getElementType() const
Return the element type of the accessed array wrt. this access.
Definition: ScopInfo.h:864

polly::MemoryAccess::getScopArrayInfo
const ScopArrayInfo * getScopArrayInfo() const
Legacy name of getOriginalScopArrayInfo().
Definition: ScopInfo.h:853

polly::MemoryAccess::getOriginalBaseAddr
Value * getOriginalBaseAddr() const
Get the original base address of this access (e.g. A for A[i+j]) when detected.
Definition: ScopInfo.h:833

polly::MemoryAccess::getStatement
ScopStmt * getStatement() const
Get the statement that contains this memory access.
Definition: ScopInfo.h:1031

polly::MemoryAccess::isAffine
bool isAffine() const
Is the memory access affine?
Definition: ScopInfo.h:1085

polly::MemoryAccess::getAccessRelation
isl::map getAccessRelation() const
Old name of getLatestAccessRelation().
Definition: ScopInfo.h:795

polly::MemoryAccess::isMemoryIntrinsic
bool isMemoryIntrinsic() const
Is this a memory intrinsic access (memcpy, memset, memmove)?
Definition: ScopInfo.h:772

polly::ScopArrayInfo
A class to store information about arrays in the SCoP.
Definition: ScopInfo.h:219

polly::ScopArrayInfo::isCompatibleWith
bool isCompatibleWith(const ScopArrayInfo *Array) const
Verify that Array is compatible to this ScopArrayInfo.
Definition: ScopInfo.cpp:271

polly::ScopArrayInfo::getBasePtrId
isl::id getBasePtrId() const
Return the isl id for the base pointer.
Definition: ScopInfo.cpp:342

polly::ScopBuilder::buildDomain
void buildDomain(ScopStmt &Stmt)
Build the domain of Stmt.
Definition: ScopBuilder.cpp:2457

polly::ScopBuilder::propagateDomainConstraintsToRegionExit
void propagateDomainConstraintsToRegionExit(BasicBlock *BB, Loop *BBLoop, SmallPtrSetImpl< BasicBlock * > &FinishedExitBlocks, DenseMap< BasicBlock *, isl::set > &InvalidDomainMap)
Propagate domains that are known due to graph properties.
Definition: ScopBuilder.cpp:630

polly::ScopBuilder::isRequiredInvariantLoad
bool isRequiredInvariantLoad(LoadInst *LI) const
Return true if and only if LI is a required invariant load.
Definition: ScopBuilder.h:650

polly::ScopBuilder::propagateInvalidStmtDomains
bool propagateInvalidStmtDomains(Region *R, DenseMap< BasicBlock *, isl::set > &InvalidDomainMap)
Propagate invalid domains of statements through R.
Definition: ScopBuilder.cpp:999

polly::ScopBuilder::ensurePHIWrite
void ensurePHIWrite(PHINode *PHI, ScopStmt *IncomintStmt, BasicBlock *IncomingBlock, Value *IncomingValue, bool IsExitBlock)
Create a write MemoryAccess for the incoming block of a phi node.
Definition: ScopBuilder.cpp:2414

polly::ScopBuilder::addInvariantLoads
void addInvariantLoads(ScopStmt &Stmt, InvariantAccessesTy &InvMAs)
Add invariant loads listed in InvMAs with the domain of Stmt.
Definition: ScopBuilder.cpp:3017

polly::ScopBuilder::canonicalizeDynamicBasePtrs
void canonicalizeDynamicBasePtrs()
Canonicalize arrays with base pointers from the same equivalence class.
Definition: ScopBuilder.cpp:3177

polly::ScopBuilder::calculateMinMaxAccess
bool calculateMinMaxAccess(AliasGroupTy AliasGroup, Scop::MinMaxVectorTy &MinMaxAccesses)
Wrapper function to calculate minimal/maximal accesses to each array.
Definition: ScopBuilder.cpp:3321

polly::ScopBuilder::verifyInvariantLoads
void verifyInvariantLoads()
Verify that all required invariant loads have been hoisted.
Definition: ScopBuilder.cpp:2787

polly::ScopBuilder::LoopStackElementTy
LoopStackElement { Loop *L LoopStackElementTy
A loop stack element to keep track of per-loop information during schedule construction.
Definition: ScopBuilder.h:704

polly::ScopBuilder::Schedule
isl::schedule Schedule
Definition: ScopBuilder.h:707

polly::ScopBuilder::addUserContext
void addUserContext()
Add user provided parameter constraints to context (command line).
Definition: ScopBuilder.cpp:2862

polly::ScopBuilder::ensureValueRead
void ensureValueRead(Value *V, ScopStmt *UserStmt)
Ensure an llvm::Value is available in the BB's statement, creating a MemoryAccess for reloading it if...
Definition: ScopBuilder.cpp:2369

polly::ScopBuilder::buildPHIAccesses
void buildPHIAccesses(ScopStmt *PHIStmt, PHINode *PHI, Region *NonAffineSubRegion, bool IsExitBlock=false)
Create MemoryAccesses for the given PHI node in the given region.
Definition: ScopBuilder.cpp:1081

polly::ScopBuilder::buildSchedule
void buildSchedule()
Construct the schedule of this SCoP.
Definition: ScopBuilder.cpp:1178

polly::ScopBuilder::GlobalReads
SmallVector< std::pair< ScopStmt *, Instruction * >, 16 > GlobalReads
Set of instructions that might read any memory location.
Definition: ScopBuilder.h:57

polly::ScopBuilder::SE
ScalarEvolution & SE
The ScalarEvolution to help building Scop.
Definition: ScopBuilder.h:51

polly::ScopBuilder::foldAccessRelations
void foldAccessRelations()
Fold memory accesses to handle parametric offset.
Definition: ScopBuilder.cpp:2323

polly::ScopBuilder::buildAliasGroupsForAccesses
std::tuple< AliasGroupVectorTy, DenseSet< const ScopArrayInfo * > > buildAliasGroupsForAccesses()
Build alias groups for all memory accesses in the Scop.
Definition: ScopBuilder.cpp:3374

polly::ScopBuilder::propagateDomainConstraints
bool propagateDomainConstraints(Region *R, DenseMap< BasicBlock *, isl::set > &InvalidDomainMap)
Propagate the domain constraints through the region R.
Definition: ScopBuilder.cpp:588

polly::ScopBuilder::buildConditionSets
bool buildConditionSets(BasicBlock *BB, Instruction *TI, Loop *L, __isl_keep isl_set *Domain, DenseMap< BasicBlock *, isl::set > &InvalidDomainMap, SmallVectorImpl< __isl_give isl_set * > &ConditionSets)
Build the condition sets for the terminator TI in the Domain.
Definition: ScopBuilder.cpp:566

polly::ScopBuilder::addPHIReadAccess
void addPHIReadAccess(ScopStmt *PHIStmt, PHINode *PHI)
Create a MemoryAccess for reading the value of a phi.
Definition: ScopBuilder.cpp:2451

polly::ScopBuilder::buildAccessCallInst
bool buildAccessCallInst(MemAccInst Inst, ScopStmt *Stmt)
Try to build a MemoryAccess for a call instruction.
Definition: ScopBuilder.cpp:1637

polly::ScopBuilder::buildScalarDependences
void buildScalarDependences(ScopStmt *UserStmt, Instruction *Inst)
Analyze and extract the cross-BB scalar dependences (or, dataflow dependencies) of an instruction.
Definition: ScopBuilder.cpp:1123

polly::ScopBuilder::foldSizeConstantsToRight
void foldSizeConstantsToRight()
Fold size constants to the right.
Definition: ScopBuilder.cpp:2193

polly::ScopBuilder::ArrayBasePointers
SmallSetVector< Value *, 16 > ArrayBasePointers
Set of all accessed array base pointers.
Definition: ScopBuilder.h:60

polly::ScopBuilder::LoopStackTy
SmallVector< LoopStackElementTy, 4 > LoopStackTy
The loop stack used for schedule construction.
Definition: ScopBuilder.h:724

polly::ScopBuilder::addMemoryAccess
MemoryAccess * addMemoryAccess(ScopStmt *Stmt, Instruction *Inst, MemoryAccess::AccessType AccType, Value *BaseAddress, Type *ElemType, bool Affine, Value *AccessValue, ArrayRef< const SCEV * > Subscripts, ArrayRef< const SCEV * > Sizes, MemoryKind Kind)
Create a new MemoryAccess object and add it to #AccFuncMap.
Definition: ScopBuilder.cpp:2114

polly::ScopBuilder::hoistInvariantLoads
void hoistInvariantLoads()
Hoist invariant memory loads and check for required ones.
Definition: ScopBuilder.cpp:2801

polly::ScopBuilder::AliasGroupVectorTy
SmallVector< AliasGroupTy, 4 > AliasGroupVectorTy
A vector of alias groups.
Definition: ScopBuilder.h:370

polly::ScopBuilder::AA
AAResults & AA
The AAResults to build AliasSetTracker.
Definition: ScopBuilder.h:36

polly::ScopBuilder::buildAccessMultiDimFixed
bool buildAccessMultiDimFixed(MemAccInst Inst, ScopStmt *Stmt)
Try to build a multi-dimensional fixed sized MemoryAccess from the Load/Store instruction.
Definition: ScopBuilder.cpp:1442

polly::ScopBuilder::DT
DominatorTree & DT
DominatorTree to reason about guaranteed execution.
Definition: ScopBuilder.h:42

polly::ScopBuilder::buildUnsignedConditionSets
__isl_give isl_set * buildUnsignedConditionSets(BasicBlock *BB, Value *Condition, __isl_keep isl_set *Domain, const SCEV *SCEV_TestVal, const SCEV *SCEV_UpperBound, DenseMap< BasicBlock *, isl::set > &InvalidDomainMap, bool IsStrictUpperBound)
Build condition sets for unsigned ICmpInst(s).
Definition: ScopBuilder.cpp:362

polly::ScopBuilder::DL
const DataLayout & DL
Target data for element size computing.
Definition: ScopBuilder.h:39

polly::ScopBuilder::buildAccessMemIntrinsic
bool buildAccessMemIntrinsic(MemAccInst Inst, ScopStmt *Stmt)
Try to build a MemoryAccess for a memory intrinsic.
Definition: ScopBuilder.cpp:1563

polly::ScopBuilder::assumeNoOutOfBounds
void assumeNoOutOfBounds()
Assume that all memory accesses are within bounds.
Definition: ScopBuilder.cpp:2329

polly::ScopBuilder::getNonHoistableCtx
isl::set getNonHoistableCtx(MemoryAccess *Access, isl::union_map Writes)
Return the context under which the access cannot be hoisted.
Definition: ScopBuilder.cpp:2903

polly::ScopBuilder::buildInvariantEquivalenceClasses
void buildInvariantEquivalenceClasses()
Create equivalence classes for required invariant accesses.
Definition: ScopBuilder.cpp:811

polly::ScopBuilder::buildAliasGroups
bool buildAliasGroups()
Build all alias groups for this SCoP.
Definition: ScopBuilder.cpp:3418

polly::ScopBuilder::addArrayAccess
void addArrayAccess(ScopStmt *Stmt, MemAccInst MemAccInst, MemoryAccess::AccessType AccType, Value *BaseAddress, Type *ElemType, bool IsAffine, ArrayRef< const SCEV * > Subscripts, ArrayRef< const SCEV * > Sizes, Value *AccessValue)
Create a MemoryAccess that represents either a LoadInst or StoreInst.
Definition: ScopBuilder.cpp:2152

polly::ScopBuilder::adjustDomainDimensions
isl::set adjustDomainDimensions(isl::set Dom, Loop *OldL, Loop *NewL)
Adjust the dimensions of Dom that was constructed for OldL to be compatible to domains constructed fo...
Definition: ScopBuilder.cpp:294

polly::ScopBuilder::buildAccessMultiDimParam
bool buildAccessMultiDimParam(MemAccInst Inst, ScopStmt *Stmt)
Try to build a multi-dimensional parametric sized MemoryAccess.
Definition: ScopBuilder.cpp:1508

polly::ScopBuilder::NumBlocksProcessed
unsigned NumBlocksProcessed
Definition: ScopBuilder.h:711

polly::ScopBuilder::buildEscapingDependences
void buildEscapingDependences(Instruction *Inst)
Build the escaping dependences for Inst.
Definition: ScopBuilder.cpp:1323

polly::ScopBuilder::buildEqivClassBlockStmts
void buildEqivClassBlockStmts(BasicBlock *BB)
Create one or more ScopStmts for BB using equivalence classes.
Definition: ScopBuilder.cpp:1945

polly::ScopBuilder::splitAliasGroupsByDomain
void splitAliasGroupsByDomain(AliasGroupVectorTy &AliasGroups)
Split alias groups by iteration domains.
Definition: ScopBuilder.cpp:3529

polly::ScopBuilder::buildAliasGroup
bool buildAliasGroup(AliasGroupTy &AliasGroup, DenseSet< const ScopArrayInfo * > HasWriteAccess)
Build a given alias group and its access data.
Definition: ScopBuilder.cpp:3450

polly::ScopBuilder::addUserAssumptions
void addUserAssumptions(AssumptionCache &AC, DenseMap< BasicBlock *, isl::set > &InvalidDomainMap)
Add user provided parameter constraints to context (source code).
Definition: ScopBuilder.cpp:1365

polly::ScopBuilder::checkForReductions
void checkForReductions(ScopStmt &Stmt)
Check for reductions in Stmt.
Definition: ScopBuilder.cpp:2592

polly::ScopBuilder::buildDomains
bool buildDomains(Region *R, DenseMap< BasicBlock *, isl::set > &InvalidDomainMap)
Compute the domain for each basic block in R.
Definition: ScopBuilder.cpp:831

polly::ScopBuilder::buildSequentialBlockStmts
void buildSequentialBlockStmts(BasicBlock *BB, bool SplitOnStore=false)
Create one or more ScopStmts for BB.
Definition: ScopBuilder.cpp:1814

polly::ScopBuilder::SD
ScopDetection & SD
Valid Regions for Scop.
Definition: ScopBuilder.h:48

polly::ScopBuilder::shouldModelInst
bool shouldModelInst(Instruction *Inst, Loop *L)
Should an instruction be modeled in a ScopStmt.
Definition: ScopBuilder.cpp:1776

polly::ScopBuilder::scop
std::unique_ptr< Scop > scop
Definition: ScopBuilder.h:63

polly::ScopBuilder::buildMemoryAccess
void buildMemoryAccess(MemAccInst Inst, ScopStmt *Stmt)
Build an instance of MemoryAccess from the Load/Store instruction.
Definition: ScopBuilder.cpp:1733

polly::ScopBuilder::buildAliasChecks
bool buildAliasChecks()
Build the alias checks for this SCoP.
Definition: ScopBuilder.cpp:3351

polly::ScopBuilder::updateAccessDimensionality
void updateAccessDimensionality()
Update access dimensionalities.
Definition: ScopBuilder.cpp:2298

polly::ScopBuilder::addRecordedAssumptions
void addRecordedAssumptions()
Add all recorded assumptions to the assumed context.
Definition: ScopBuilder.cpp:1331

polly::ScopBuilder::buildAccessRelations
void buildAccessRelations(ScopStmt &Stmt)
Build the access relation of all memory accesses of Stmt.
Definition: ScopBuilder.cpp:3207

polly::ScopBuilder::RecordedAssumptions
RecordedAssumptionsTy RecordedAssumptions
Collection to hold taken assumptions.
Definition: ScopBuilder.h:75

polly::ScopBuilder::hasNonHoistableBasePtrInScop
bool hasNonHoistableBasePtrInScop(MemoryAccess *MA, isl::union_map Writes)
Check if the base ptr of MA is in the SCoP but not hoistable.
Definition: ScopBuilder.cpp:2848

polly::ScopBuilder::addLoopBoundsToHeaderDomain
bool addLoopBoundsToHeaderDomain(Loop *L, DenseMap< BasicBlock *, isl::set > &InvalidDomainMap)
Add loop carried constraints to the header block of the loop L.
Definition: ScopBuilder.cpp:730

polly::ScopBuilder::buildDomainsWithBranchConstraints
bool buildDomainsWithBranchConstraints(Region *R, DenseMap< BasicBlock *, isl::set > &InvalidDomainMap)
Compute the branching constraints for each basic block in R.
Definition: ScopBuilder.cpp:871

polly::ScopBuilder::buildAccessFunctions
void buildAccessFunctions()
Build the access functions for the subregion SR.
Definition: ScopBuilder.cpp:1754

polly::ScopBuilder::canAlwaysBeHoisted
bool canAlwaysBeHoisted(MemoryAccess *MA, bool StmtInvalidCtxIsEmpty, bool MAInvalidCtxIsEmpty, bool NonHoistableCtxIsEmpty)
Check if MA can always be hoisted without execution context.
Definition: ScopBuilder.cpp:2981

polly::ScopBuilder::buildAccessSingleDim
bool buildAccessSingleDim(MemAccInst Inst, ScopStmt *Stmt)
Build a single-dimensional parametric sized MemoryAccess from the Load/Store instruction.
Definition: ScopBuilder.cpp:1684

polly::ScopBuilder::collectSurroundingLoops
void collectSurroundingLoops(ScopStmt &Stmt)
Fill NestLoops with loops surrounding Stmt.
Definition: ScopBuilder.cpp:2464

polly::ScopBuilder::finalizeAccesses
void finalizeAccesses()
Finalize all access relations.
Definition: ScopBuilder.cpp:2291

polly::ScopBuilder::buildScop
void buildScop(Region &R, AssumptionCache &AC)
Definition: ScopBuilder.cpp:3623

polly::ScopBuilder::LI
LoopInfo & LI
LoopInfo for information about loops.
Definition: ScopBuilder.h:45

polly::ScopBuilder::ORE
OptimizationRemarkEmitter & ORE
An optimization diagnostic interface to add optimization remarks.
Definition: ScopBuilder.h:54

polly::ScopBuilder::buildStmts
void buildStmts(Region &SR)
Create ScopStmt for all BBs and non-affine subregions of SR.
Definition: ScopBuilder.cpp:2029

polly::ScopBuilder::ensureValueWrite
void ensureValueWrite(Instruction *Inst)
Create a MemoryAccess for writing an llvm::Instruction.
Definition: ScopBuilder.cpp:2343

polly::ScopBuilder::AliasGroupTy
SmallVector< MemoryAccess *, 4 > AliasGroupTy
A vector of memory accesses that belong to an alias group.
Definition: ScopBuilder.h:367

polly::ScopBuilder::getPwAff
__isl_give isl_pw_aff * getPwAff(BasicBlock *BB, DenseMap< BasicBlock *, isl::set > &InvalidDomainMap, const SCEV *E, bool NonNegative=false)
Compute the isl representation for the SCEV E in this BB.
Definition: ScopBuilder.cpp:346

polly::ScopBuilder::getPredecessorDomainConstraints
isl::set getPredecessorDomainConstraints(BasicBlock *BB, isl::set Domain)
Compute the union of predecessor domains for BB.
Definition: ScopBuilder.cpp:675

polly::ScopBuilder::ScopBuilder
ScopBuilder(Region *R, AssumptionCache &AC, AAResults &AA, const DataLayout &DL, DominatorTree &DT, LoopInfo &LI, ScopDetection &SD, ScalarEvolution &SE, OptimizationRemarkEmitter &ORE)
Definition: ScopBuilder.cpp:3776

polly::ScopDetection
Pass to detect the maximal static control parts (Scops) of a function.
Definition: ScopDetection.h:133

polly::ScopDetection::getDetectionContext
DetectionContext * getDetectionContext(const Region *R) const
Return the detection context for R, nullptr if R was invalid.
Definition: ScopDetection.cpp:1959

polly::ScopDetection::getNextID
int getNextID()
Definition: ScopDetection.h:201

polly::ScopDetection::isErrorBlock
bool isErrorBlock(llvm::BasicBlock &BB, const llvm::Region &R)
Check if the block is an error block.
Definition: ScopDetection.cpp:1474

polly::ScopStmt
Statement of the Scop.
Definition: ScopInfo.h:1140

polly::ScopStmt::addAccess
void addAccess(MemoryAccess *Access, bool Preprend=false)
Add Access to this statement's list of accesses.
Definition: ScopInfo.cpp:1127

polly::ScopStmt::getArrayAccessFor
MemoryAccess & getArrayAccessFor(const Instruction *Inst) const
Return the only array access for Inst.
Definition: ScopInfo.h:1434

polly::ScopStmt::getParent
Scop * getParent()
Definition: ScopInfo.h:1528

polly::ScopStmt::getEntryBlock
BasicBlock * getEntryBlock() const
Return a BasicBlock from this statement.
Definition: ScopInfo.cpp:1221

polly::ScopStmt::Domain
isl::set Domain
The iteration domain describes the set of iterations for which this statement is executed.
Definition: ScopInfo.h:1207

polly::ScopStmt::getInstructions
const std::vector< Instruction * > & getInstructions() const
Definition: ScopInfo.h:1531

polly::ScopStmt::isBlockStmt
bool isBlockStmt() const
Return true if this statement represents a single basic block.
Definition: ScopInfo.h:1321

polly::ScopStmt::getInvalidContext
isl::set getInvalidContext() const
Get the invalid context for this statement.
Definition: ScopInfo.h:1309

polly::ScopStmt::NestLoops
SmallVector< Loop *, 4 > NestLoops
Definition: ScopInfo.h:1258

polly::ScopStmt::getRegion
Region * getRegion() const
Get the region represented by this ScopStmt (if any).
Definition: ScopInfo.h:1330

polly::ScopStmt::represents
bool represents(BasicBlock *BB) const
Return whether this statement represents BB.
Definition: ScopInfo.h:1351

polly::ScopStmt::getBasicBlock
BasicBlock * getBasicBlock() const
Get the BasicBlock represented by this ScopStmt (if any).
Definition: ScopInfo.h:1318

polly::ScopStmt::MemAccs
MemoryAccessVec MemAccs
The memory accesses of this statement.
Definition: ScopInfo.h:1212

polly::ScopStmt::getBaseName
const char * getBaseName() const
Definition: ScopInfo.cpp:1229

polly::ScopStmt::contains
bool contains(const Loop *L) const
Return whether L is boxed within this statement.
Definition: ScopInfo.h:1342

polly::ScopStmt::isRegionStmt
bool isRegionStmt() const
Return true if this statement represents a whole region.
Definition: ScopInfo.h:1333

polly::ScopStmt::setInvalidDomain
void setInvalidDomain(isl::set ID)
Set the invalid context for this statement to ID.
Definition: ScopInfo.cpp:1219

polly::ScopStmt::getDomain
isl::set getDomain() const
Get the iteration domain of this ScopStmt.
Definition: ScopInfo.cpp:1237

polly::ScopStmt::lookupValueWriteOf
MemoryAccess * lookupValueWriteOf(Instruction *Inst) const
Return the MemoryAccess that writes the value of an instruction defined in this statement,...
Definition: ScopInfo.h:1444

polly::ScopStmt::getSurroundingLoop
Loop * getSurroundingLoop() const
Return the closest innermost loop that contains this statement, but is not contained in it.
Definition: ScopInfo.h:1381

polly::ScopStmt::lookupPHIWriteOf
MemoryAccess * lookupPHIWriteOf(PHINode *PHI) const
Return the PHI write MemoryAccess for the incoming values from any basic block in this ScopStmt,...
Definition: ScopInfo.h:1465

polly::ScopStmt::lookupValueReadOf
MemoryAccess * lookupValueReadOf(Value *Inst) const
Return the MemoryAccess that reloads a value, or nullptr if not existing, respectively not yet added.
Definition: ScopInfo.h:1452

polly::Scop
Static Control Part.
Definition: ScopInfo.h:1630

polly::Scop::MinMaxVectorTy
SmallVector< MinMaxAccessTy, 4 > MinMaxVectorTy
Vector of minimal/maximal accesses to different arrays.
Definition: ScopInfo.h:1636

polly::Scop::incrementNumberOfAliasingAssumptions
static void incrementNumberOfAliasingAssumptions(unsigned Step)
Increment actual number of aliasing assumptions taken.
Definition: ScopInfo.cpp:2497

polly::Scop::getRegion
const Region & getRegion() const
Get the maximum region of this static control part.
Definition: ScopInfo.h:2088

polly::VirtualUse::create
static VirtualUse create(Scop *S, const Use &U, LoopInfo *LI, bool Virtual)
Get a VirtualUse for an llvm::Use.
Definition: VirtualInstruction.cpp:19

polly::VirtualUse::Intra
@ Intra
Definition: VirtualInstruction.h:59

polly::VirtualUse::Block
@ Block
Definition: VirtualInstruction.h:41

polly::VirtualUse::ReadOnly
@ ReadOnly
Definition: VirtualInstruction.h:55

polly::VirtualUse::Hoisted
@ Hoisted
Definition: VirtualInstruction.h:49

polly::VirtualUse::Synthesizable
@ Synthesizable
Definition: VirtualInstruction.h:44

polly::VirtualUse::Constant
@ Constant
Definition: VirtualInstruction.h:38

polly::VirtualUse::Inter
@ Inter
Definition: VirtualInstruction.h:63

isl_ctx_last_error
enum isl_error isl_ctx_last_error(isl_ctx *ctx)
Definition: isl_ctx.c:321

__isl_give
#define __isl_give
Definition: ctx.h:19

isl_error_quota
@ isl_error_quota
Definition: ctx.h:81

__isl_keep
#define __isl_keep
Definition: ctx.h:25

isl_size
int isl_size
Definition: ctx.h:96

isl_id_free
__isl_null isl_id * isl_id_free(__isl_take isl_id *id)
Definition: isl_id.c:207

isl_id_get_user
void * isl_id_get_user(__isl_keep isl_id *id)
Definition: isl_id.c:36

C
#define C(FN,...)
Definition: isl_test2.cc:197

assert
#define assert(exp)
Definition: isl_test_cpp-checked.cc:43

isl_local_space_from_space
__isl_give isl_local_space * isl_local_space_from_space(__isl_take isl_space *space)
Definition: isl_local_space.c:93

isl_set
struct isl_set isl_set
Definition: map_type.h:26

isl::manage_copy
aff manage_copy(__isl_keep isl_aff *ptr)
Definition: isl-noexceptions.h:4853

isl::dim::in
@ in

isl::dim::div
@ div

isl::dim::out
@ out

isl::dim::set
@ set

isl::dim::param
@ param

isl::manage
boolean manage(isl_bool val)
Definition: isl-noexceptions.h:95

llvm
This file contains the declaration of the PolyhedralInfo class, which will provide an interface to ex...
Definition: Canonicalization.h:14

polly
Definition: Canonicalization.h:20

polly::PWACtx
std::pair< isl::pw_aff, isl::set > PWACtx
The result type of the SCEVAffinator.
Definition: SCEVAffinator.h:27

polly::getRegionNodeLoop
llvm::Loop * getRegionNodeLoop(llvm::RegionNode *RN, llvm::LoopInfo &LI)
Return the smallest loop surrounding RN.

polly::isAffineConstraint
bool isAffineConstraint(llvm::Value *V, const llvm::Region *R, llvm::Loop *Scope, llvm::ScalarEvolution &SE, ParameterSetTy &Params, bool OrExpr=false)
Check if V describes an affine constraint in R.

polly::MaxDisjunctsInDomain
unsigned const MaxDisjunctsInDomain
Definition: ScopInfo.cpp:118

polly::getIslCompatibleName
std::string getIslCompatibleName(const std::string &Prefix, const llvm::Value *Val, long Number, const std::string &Suffix, bool UseInstructionNames)
Combine Prefix, Val (or Number) and Suffix to an isl-compatible name.

polly::findValues
void findValues(const llvm::SCEV *Expr, llvm::ScalarEvolution &SE, llvm::SetVector< llvm::Value * > &Values)
Find the values referenced by SCEVUnknowns in a given SCEV expression.

polly::findLoops
void findLoops(const llvm::SCEV *Expr, llvm::SetVector< const llvm::Loop * > &Loops)
Find the loops referenced from a SCEV expression.

polly::getConditionFromTerminator
llvm::Value * getConditionFromTerminator(llvm::Instruction *TI)
Return the condition for the terminator TI.

polly::isAffineExpr
bool isAffineExpr(const llvm::Region *R, llvm::Loop *Scope, const llvm::SCEV *Expression, llvm::ScalarEvolution &SE, InvariantLoadsSetTy *ILS=nullptr)

polly::getNumBlocksInRegionNode
unsigned getNumBlocksInRegionNode(llvm::RegionNode *RN)
Get the number of blocks in RN.

polly::getFirstNonBoxedLoopFor
llvm::Loop * getFirstNonBoxedLoopFor(llvm::Loop *L, llvm::LoopInfo &LI, const BoxedLoopsSetTy &BoxedLoops)
Definition: ScopHelper.cpp:688

polly::getDebugLocations
void getDebugLocations(const BBPair &P, DebugLoc &Begin, DebugLoc &End)
Set the begin and end source location for the region limited by P.
Definition: ScopDetectionDiagnostic.cpp:112

polly::AS_RESTRICTION
@ AS_RESTRICTION
Definition: ScopHelper.h:57

polly::AS_ASSUMPTION
@ AS_ASSUMPTION
Definition: ScopHelper.h:57

polly::MemoryKind
MemoryKind
The different memory kinds used in Polly.
Definition: ScopInfo.h:100

polly::MemoryKind::Array
@ Array
MemoryKind::Array: Models a one or multi-dimensional array.

polly::MemoryKind::Value
@ Value
MemoryKind::Value: Models an llvm::Value.

polly::MemoryKind::PHI
@ PHI
MemoryKind::PHI: Models PHI nodes within the SCoP.

polly::MemoryKind::ExitPHI
@ ExitPHI
MemoryKind::ExitPHI: Models PHI nodes in the SCoP's exit block.

polly::hasDisableAllTransformsHint
bool hasDisableAllTransformsHint(llvm::Loop *L)
Does the loop's LoopID contain a 'llvm.loop.disable_heuristics' property?

polly::tryForwardThroughPHI
const llvm::SCEV * tryForwardThroughPHI(const llvm::SCEV *Expr, llvm::Region &R, llvm::ScalarEvolution &SE, ScopDetection *SD)
Try to look through PHI nodes, where some incoming edges come from error blocks.

polly::isDebugCall
bool isDebugCall(llvm::Instruction *Inst)
Is the given instruction a call to a debug function?

polly::rangeIslSize
llvm::iota_range< unsigned > rangeIslSize(unsigned Begin, isl::size End)
Check that End is valid and return an iterator from Begin to End.
Definition: ISLTools.cpp:597

polly::simplify
void simplify(isl::set &Set)
Simplify a set inplace.
Definition: ISLTools.cpp:289

polly::getBBPairForRegion
BBPair getBBPairForRegion(const Region *R)
Return the region delimiters (entry & exit block) of R.
Definition: ScopDetectionDiagnostic.cpp:108

polly::getLoopSurroundingScop
llvm::Loop * getLoopSurroundingScop(Scop &S, llvm::LoopInfo &LI)
Get the smallest loop that contains S but is not in S.

polly::UseInstructionNames
bool UseInstructionNames
Definition: ScopInfo.cpp:156

polly::InvariantLoadsSetTy
llvm::SetVector< llvm::AssertingVH< llvm::LoadInst > > InvariantLoadsSetTy
Type for a set of invariant loads.
Definition: ScopHelper.h:109

polly::recordAssumption
void recordAssumption(RecordedAssumptionsTy *RecordedAssumptions, AssumptionKind Kind, isl::set Set, llvm::DebugLoc Loc, AssumptionSign Sign, llvm::BasicBlock *BB=nullptr, bool RTC=true)
Record an assumption for later addition to the assumed context.

polly::extractConstantFactor
std::pair< const llvm::SCEVConstant *, const llvm::SCEV * > extractConstantFactor(const llvm::SCEV *M, llvm::ScalarEvolution &SE)
Extract the constant factors from the multiplication M.

polly::ParameterSetTy
llvm::SetVector< const llvm::SCEV * > ParameterSetTy
Set type for parameters.
Definition: ScopHelper.h:112

polly::ModelReadOnlyScalars
bool ModelReadOnlyScalars
Command line switch whether to model read-only accesses.
Definition: ScopBuilder.cpp:71

polly::createIslLoopAttr
isl::id createIslLoopAttr(isl::ctx Ctx, llvm::Loop *L)
Create an isl::id that identifies an original loop.

polly::PollyUseRuntimeAliasChecks
bool PollyUseRuntimeAliasChecks
Definition: ScopDetection.cpp:159

polly::PollyDelinearize
bool PollyDelinearize
Definition: ScopDetection.cpp:235

polly::INFINITELOOP
@ INFINITELOOP
Definition: ScopHelper.h:51

polly::ERRORBLOCK
@ ERRORBLOCK
Definition: ScopHelper.h:49

polly::INVARIANTLOAD
@ INVARIANTLOAD
Definition: ScopHelper.h:52

polly::COMPLEXITY
@ COMPLEXITY
Definition: ScopHelper.h:50

polly::ALIASING
@ ALIASING
Definition: ScopHelper.h:44

polly::PROFITABLE
@ PROFITABLE
Definition: ScopHelper.h:48

polly::INBOUNDS
@ INBOUNDS
Definition: ScopHelper.h:45

polly::DELINEARIZATION
@ DELINEARIZATION
Definition: ScopHelper.h:53

polly::getUniqueNonErrorValue
llvm::Value * getUniqueNonErrorValue(llvm::PHINode *PHI, llvm::Region *R, ScopDetection *SD)
Return a unique non-error block incoming value for PHI if available.

polly::PollyInvariantLoadHoisting
bool PollyInvariantLoadHoisting
Definition: ScopDetection.cpp:218

polly::isIgnoredIntrinsic
bool isIgnoredIntrinsic(const llvm::Value *V)
Return true iff V is an intrinsic that we ignore during code generation.

polly::canSynthesize
bool canSynthesize(const llvm::Value *V, const Scop &S, llvm::ScalarEvolution *SE, llvm::Loop *Scope)
Check whether a value can be synthesized by the code generator.

polly::InvariantAccessesTy
SmallVector< InvariantAccess, 8 > InvariantAccessesTy
Ordered container type to hold invariant accesses.
Definition: ScopInfo.h:1103

polly::APIntFromVal
llvm::APInt APIntFromVal(__isl_take isl_val *Val)
Translate isl_val to llvm::APInt.
Definition: GICHelper.cpp:51

polly::getNumBlocksInLoop
unsigned getNumBlocksInLoop(llvm::Loop *L)
Get the number of blocks in L.

polly::MemoryAccessList
std::forward_list< MemoryAccess * > MemoryAccessList
Ordered list type to hold accesses.
Definition: ScopInfo.h:1091

isl_set_universe
__isl_export __isl_give isl_set * isl_set_universe(__isl_take isl_space *space)
Definition: isl_map.c:6366

isl_set_coalesce
__isl_export __isl_give isl_set * isl_set_coalesce(__isl_take isl_set *set)
Definition: isl_coalesce.c:4261

isl_set_subtract
__isl_export __isl_give isl_set * isl_set_subtract(__isl_take isl_set *set1, __isl_take isl_set *set2)
Definition: isl_map_subtract.c:588

isl_set_get_space
__isl_export __isl_give isl_space * isl_set_get_space(__isl_keep isl_set *set)
Definition: isl_map.c:603

isl_set_union
__isl_export __isl_give isl_set * isl_set_union(__isl_take isl_set *set1, __isl_take isl_set *set2)
Definition: isl_map.c:8281

isl_set_n_param
isl_size isl_set_n_param(__isl_keep isl_set *set)
Definition: isl_map.c:227

isl_set_complement
__isl_export __isl_give isl_set * isl_set_complement(__isl_take isl_set *set)
Definition: isl_map_subtract.c:941

isl_set_free
__isl_null isl_set * isl_set_free(__isl_take isl_set *set)
Definition: isl_map.c:3513

isl_set_copy
__isl_give isl_set * isl_set_copy(__isl_keep isl_set *set)
Definition: isl_map.c:1470

isl_set_project_out
__isl_give isl_set * isl_set_project_out(__isl_take isl_set *set, enum isl_dim_type type, unsigned first, unsigned n)
Definition: isl_map.c:4639

isl_set_n_basic_set
__isl_export isl_size isl_set_n_basic_set(__isl_keep isl_set *set)
Definition: isl_map.c:11257

isl_set_intersect
__isl_export __isl_give isl_set * isl_set_intersect(__isl_take isl_set *set1, __isl_take isl_set *set2)
Definition: isl_map.c:3965

isl_set_get_dim_id
__isl_give isl_id * isl_set_get_dim_id(__isl_keep isl_set *set, enum isl_dim_type type, unsigned pos)
Definition: isl_map.c:1003

isl_set_empty
__isl_export __isl_give isl_set * isl_set_empty(__isl_take isl_space *space)
Definition: isl_map.c:6343

isl_set_params
__isl_export __isl_give isl_set * isl_set_params(__isl_take isl_set *set)
Definition: isl_map.c:5948

isl_space_set_alloc
__isl_give isl_space * isl_space_set_alloc(isl_ctx *ctx, unsigned nparam, unsigned dim)
Definition: isl_space.c:156

isl_dim_param
@ isl_dim_param
Definition: space_type.h:15

Kind
Definition: template_cpp.h:55

S
Definition: isl_test_cpp17-generic.cc:3

isl_pw_aff
Definition: isl_aff_private.h:34

polly::Assumption
Helper struct to remember assumptions.
Definition: ScopHelper.h:60

polly::InvariantEquivClassTy
Type for equivalent invariant accesses and their domain context.
Definition: ScopInfo.h:1106

polly::InvariantEquivClassTy::InvariantAccesses
MemoryAccessList InvariantAccesses
Memory accesses now treated as invariant.
Definition: ScopInfo.h:1115

Domain
static TupleKindPtr Domain("Domain")