doxygen/ScopDetection_8cpp_source.html

//===- ScopDetection.cpp - Detect Scops -----------------------------------===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

//

// Detect the maximal Scops of a function.

//

// A static control part (Scop) is a subgraph of the control flow graph (CFG)

// that only has statically known control flow and can therefore be described

// within the polyhedral model.

//

// Every Scop fulfills these restrictions:

//

// * It is a single entry single exit region

//

// * Only affine linear bounds in the loops

//

// Every natural loop in a Scop must have a number of loop iterations that can

// be described as an affine linear function in surrounding loop iterators or

// parameters. (A parameter is a scalar that does not change its value during

// execution of the Scop).

//

// * Only comparisons of affine linear expressions in conditions

//

// * All loops and conditions perfectly nested

//

// The control flow needs to be structured such that it could be written using

// just 'for' and 'if' statements, without the need for any 'goto', 'break' or

// 'continue'.

//

// * Side effect free functions call

//

// Function calls and intrinsics that do not have side effects (readnone)

// or memory intrinsics (memset, memcpy, memmove) are allowed.

//

// The Scop detection finds the largest Scops by checking if the largest

// region is a Scop. If this is not the case, its canonical subregions are

// checked until a region is a Scop. It is now tried to extend this Scop by

// creating a larger non canonical region.

//

//===----------------------------------------------------------------------===//


#include "polly/ScopDetection.h"

#include "polly/LinkAllPasses.h"

#include "polly/Options.h"

#include "polly/ScopDetectionDiagnostic.h"

#include "polly/Support/SCEVValidator.h"

#include "polly/Support/ScopHelper.h"

#include "polly/Support/ScopLocation.h"

#include "llvm/ADT/SmallPtrSet.h"

#include "llvm/ADT/Statistic.h"

#include "llvm/Analysis/AliasAnalysis.h"

#include "llvm/Analysis/Delinearization.h"

#include "llvm/Analysis/Loads.h"

#include "llvm/Analysis/LoopInfo.h"

#include "llvm/Analysis/OptimizationRemarkEmitter.h"

#include "llvm/Analysis/RegionInfo.h"

#include "llvm/Analysis/ScalarEvolution.h"

#include "llvm/Analysis/ScalarEvolutionExpressions.h"

#include "llvm/IR/BasicBlock.h"

#include "llvm/IR/DebugLoc.h"

#include "llvm/IR/DerivedTypes.h"

#include "llvm/IR/DiagnosticInfo.h"

#include "llvm/IR/DiagnosticPrinter.h"

#include "llvm/IR/Dominators.h"

#include "llvm/IR/Function.h"

#include "llvm/IR/InstrTypes.h"

#include "llvm/IR/Instruction.h"

#include "llvm/IR/Instructions.h"

#include "llvm/IR/IntrinsicInst.h"

#include "llvm/IR/Metadata.h"

#include "llvm/IR/Module.h"

#include "llvm/IR/PassManager.h"

#include "llvm/IR/Value.h"

#include "llvm/InitializePasses.h"

#include "llvm/Pass.h"

#include "llvm/Support/Debug.h"

#include "llvm/Support/Regex.h"

#include "llvm/Support/raw_ostream.h"

#include <algorithm>

#include <cassert>

#include <memory>

#include <stack>

#include <string>

#include <utility>

#include <vector>


using namespace llvm;

using namespace polly;


#include "polly/Support/PollyDebug.h"

#define DEBUG_TYPE "polly-detect"


// This option is set to a very high value, as analyzing such loops increases

// compile time on several cases. For experiments that enable this option,

// a value of around 40 has been working to avoid run-time regressions with

// Polly while still exposing interesting optimization opportunities.

static cl::opt<int> ProfitabilityMinPerLoopInstructions(

    "polly-detect-profitability-min-per-loop-insts",

    cl::desc("The minimal number of per-loop instructions before a single loop "

             "region is considered profitable"),

    cl::Hidden, cl::ValueRequired, cl::init(100000000), cl::cat(PollyCategory));


bool polly::PollyProcessUnprofitable;


static cl::opt<bool, true> XPollyProcessUnprofitable(

    "polly-process-unprofitable",

    cl::desc(

        "Process scops that are unlikely to benefit from Polly optimizations."),

    cl::location(PollyProcessUnprofitable), cl::cat(PollyCategory));


static cl::list<std::string> OnlyFunctions(

    "polly-only-func",

    cl::desc("Only run on functions that match a regex. "

             "Multiple regexes can be comma separated. "

             "Scop detection will run on all functions that match "

             "ANY of the regexes provided."),

    cl::CommaSeparated, cl::cat(PollyCategory));


static cl::list<std::string> IgnoredFunctions(

    "polly-ignore-func",

    cl::desc("Ignore functions that match a regex. "

             "Multiple regexes can be comma separated. "

             "Scop detection will ignore all functions that match "

             "ANY of the regexes provided."),

    cl::CommaSeparated, cl::cat(PollyCategory));


bool polly::PollyAllowFullFunction;


static cl::opt<bool, true>

    XAllowFullFunction("polly-detect-full-functions",

                       cl::desc("Allow the detection of full functions"),

                       cl::location(polly::PollyAllowFullFunction),

                       cl::init(false), cl::cat(PollyCategory));


static cl::opt<std::string> OnlyRegion(

    "polly-only-region",

    cl::desc("Only run on certain regions (The provided identifier must "

             "appear in the name of the region's entry block"),

    cl::value_desc("identifier"), cl::ValueRequired, cl::init(""),

    cl::cat(PollyCategory));


static cl::opt<bool>

    IgnoreAliasing("polly-ignore-aliasing",

                   cl::desc("Ignore possible aliasing of the array bases"),

                   cl::Hidden, cl::cat(PollyCategory));


bool polly::PollyAllowUnsignedOperations;


static cl::opt<bool, true> XPollyAllowUnsignedOperations(

    "polly-allow-unsigned-operations",

    cl::desc("Allow unsigned operations such as comparisons or zero-extends."),

    cl::location(PollyAllowUnsignedOperations), cl::Hidden, cl::init(true),

    cl::cat(PollyCategory));


bool polly::PollyUseRuntimeAliasChecks;


static cl::opt<bool, true> XPollyUseRuntimeAliasChecks(

    "polly-use-runtime-alias-checks",

    cl::desc("Use runtime alias checks to resolve possible aliasing."),

    cl::location(PollyUseRuntimeAliasChecks), cl::Hidden, cl::init(true),

    cl::cat(PollyCategory));


static cl::opt<bool>

    ReportLevel("polly-report",

                cl::desc("Print information about the activities of Polly"),

                cl::cat(PollyCategory));


static cl::opt<bool> AllowDifferentTypes(

    "polly-allow-differing-element-types",

    cl::desc("Allow different element types for array accesses"), cl::Hidden,

    cl::init(true), cl::cat(PollyCategory));


static cl::opt<bool>

    AllowNonAffine("polly-allow-nonaffine",

                   cl::desc("Allow non affine access functions in arrays"),

                   cl::Hidden, cl::cat(PollyCategory));


static cl::opt<bool>

    AllowModrefCall("polly-allow-modref-calls",

                    cl::desc("Allow functions with known modref behavior"),

                    cl::Hidden, cl::cat(PollyCategory));


static cl::opt<bool> AllowNonAffineSubRegions(

    "polly-allow-nonaffine-branches",

    cl::desc("Allow non affine conditions for branches"), cl::Hidden,

    cl::init(true), cl::cat(PollyCategory));


static cl::opt<bool>

    AllowNonAffineSubLoops("polly-allow-nonaffine-loops",

                           cl::desc("Allow non affine conditions for loops"),

                           cl::Hidden, cl::cat(PollyCategory));


static cl::opt<bool, true>

    TrackFailures("polly-detect-track-failures",

                  cl::desc("Track failure strings in detecting scop regions"),

                  cl::location(PollyTrackFailures), cl::Hidden, cl::init(true),

                  cl::cat(PollyCategory));


static cl::opt<bool> KeepGoing("polly-detect-keep-going",

                               cl::desc("Do not fail on the first error."),

                               cl::Hidden, cl::cat(PollyCategory));


static cl::opt<bool, true>

    PollyDelinearizeX("polly-delinearize",

                      cl::desc("Delinearize array access functions"),

                      cl::location(PollyDelinearize), cl::Hidden,

                      cl::init(true), cl::cat(PollyCategory));


static cl::opt<bool>

    VerifyScops("polly-detect-verify",

                cl::desc("Verify the detected SCoPs after each transformation"),

                cl::Hidden, cl::cat(PollyCategory));


bool polly::PollyInvariantLoadHoisting;


static cl::opt<bool, true>

    XPollyInvariantLoadHoisting("polly-invariant-load-hoisting",

                                cl::desc("Hoist invariant loads."),

                                cl::location(PollyInvariantLoadHoisting),

                                cl::Hidden, cl::cat(PollyCategory));


static cl::opt<bool> PollyAllowErrorBlocks(

    "polly-allow-error-blocks",

    cl::desc("Allow to speculate on the execution of 'error blocks'."),

    cl::Hidden, cl::init(true), cl::cat(PollyCategory));


/// The minimal trip count under which loops are considered unprofitable.

static const unsigned MIN_LOOP_TRIP_COUNT = 8;


bool polly::PollyTrackFailures = false;

bool polly::PollyDelinearize = false;

StringRef polly::PollySkipFnAttr = "polly.skip.fn";


//===----------------------------------------------------------------------===//

// Statistics.


STATISTIC(NumScopRegions, "Number of scops");

STATISTIC(NumLoopsInScop, "Number of loops in scops");

STATISTIC(NumScopsDepthZero, "Number of scops with maximal loop depth 0");

STATISTIC(NumScopsDepthOne, "Number of scops with maximal loop depth 1");

STATISTIC(NumScopsDepthTwo, "Number of scops with maximal loop depth 2");

STATISTIC(NumScopsDepthThree, "Number of scops with maximal loop depth 3");

STATISTIC(NumScopsDepthFour, "Number of scops with maximal loop depth 4");

STATISTIC(NumScopsDepthFive, "Number of scops with maximal loop depth 5");

STATISTIC(NumScopsDepthLarger,

          "Number of scops with maximal loop depth 6 and larger");

STATISTIC(NumProfScopRegions, "Number of scops (profitable scops only)");

STATISTIC(NumLoopsInProfScop,

          "Number of loops in scops (profitable scops only)");

STATISTIC(NumLoopsOverall, "Number of total loops");

STATISTIC(NumProfScopsDepthZero,

          "Number of scops with maximal loop depth 0 (profitable scops only)");

STATISTIC(NumProfScopsDepthOne,

          "Number of scops with maximal loop depth 1 (profitable scops only)");

STATISTIC(NumProfScopsDepthTwo,

          "Number of scops with maximal loop depth 2 (profitable scops only)");

STATISTIC(NumProfScopsDepthThree,

          "Number of scops with maximal loop depth 3 (profitable scops only)");

STATISTIC(NumProfScopsDepthFour,

          "Number of scops with maximal loop depth 4 (profitable scops only)");

STATISTIC(NumProfScopsDepthFive,

          "Number of scops with maximal loop depth 5 (profitable scops only)");

STATISTIC(NumProfScopsDepthLarger,

          "Number of scops with maximal loop depth 6 and larger "

          "(profitable scops only)");

STATISTIC(MaxNumLoopsInScop, "Maximal number of loops in scops");

STATISTIC(MaxNumLoopsInProfScop,

          "Maximal number of loops in scops (profitable scops only)");


static void updateLoopCountStatistic(ScopDetection::LoopStats Stats,

                                     bool OnlyProfitable);


namespace {


class DiagnosticScopFound final : public DiagnosticInfo {

private:

  static int PluginDiagnosticKind;


  Function &F;

  std::string FileName;

  unsigned EntryLine, ExitLine;


public:

  DiagnosticScopFound(Function &F, std::string FileName, unsigned EntryLine,

                      unsigned ExitLine)

      : DiagnosticInfo(PluginDiagnosticKind, DS_Note), F(F), FileName(FileName),

        EntryLine(EntryLine), ExitLine(ExitLine) {}


  void print(DiagnosticPrinter &DP) const override;


  static bool classof(const DiagnosticInfo *DI) {

    return DI->getKind() == PluginDiagnosticKind;

  }

};

} // namespace


int DiagnosticScopFound::PluginDiagnosticKind =

    getNextAvailablePluginDiagnosticKind();


void DiagnosticScopFound::print(DiagnosticPrinter &DP) const {

  DP << "Polly detected an optimizable loop region (scop) in function '" << F

     << "'\n";


  if (FileName.empty()) {

    DP << "Scop location is unknown. Compile with debug info "

          "(-g) to get more precise information. ";

    return;

  }


  DP << FileName << ":" << EntryLine << ": Start of scop\n";

  DP << FileName << ":" << ExitLine << ": End of scop";

}


/// Check if a string matches any regex in a list of regexes.

/// @param Str the input string to match against.

/// @param RegexList a list of strings that are regular expressions.

static bool doesStringMatchAnyRegex(StringRef Str,

                                    const cl::list<std::string> &RegexList) {

  for (auto RegexStr : RegexList) {

    Regex R(RegexStr);


    std::string Err;

    if (!R.isValid(Err))

      report_fatal_error(Twine("invalid regex given as input to polly: ") + Err,

                         true);


    if (R.match(Str))

      return true;

  }

  return false;

}


//===----------------------------------------------------------------------===//

// ScopDetection.


ScopDetection::ScopDetection(const DominatorTree &DT, ScalarEvolution &SE,

                             LoopInfo &LI, RegionInfo &RI, AAResults &AA,

                             OptimizationRemarkEmitter &ORE)

    : DT(DT), SE(SE), LI(LI), RI(RI), AA(AA), ORE(ORE) {}


void ScopDetection::detect(Function &F) {

  assert(ValidRegions.empty() && "Detection must run only once");


  if (!PollyProcessUnprofitable && LI.empty())

    return;


  Region *TopRegion = RI.getTopLevelRegion();


  if (!OnlyFunctions.empty() &&

      !doesStringMatchAnyRegex(F.getName(), OnlyFunctions))

    return;


  if (doesStringMatchAnyRegex(F.getName(), IgnoredFunctions))

    return;


  if (!isValidFunction(F))

    return;


  findScops(*TopRegion);


  NumScopRegions += ValidRegions.size();


  // Prune non-profitable regions.

  for (auto &DIt : DetectionContextMap) {

    DetectionContext &DC = *DIt.getSecond().get();

    if (DC.Log.hasErrors())

      continue;

    if (!ValidRegions.count(&DC.CurRegion))

      continue;

    LoopStats Stats = countBeneficialLoops(&DC.CurRegion, SE, LI, 0);

    updateLoopCountStatistic(Stats, false /* OnlyProfitable */);

    if (isProfitableRegion(DC)) {

      updateLoopCountStatistic(Stats, true /* OnlyProfitable */);

      continue;

    }


    ValidRegions.remove(&DC.CurRegion);

  }


  NumProfScopRegions += ValidRegions.size();

  NumLoopsOverall += countBeneficialLoops(TopRegion, SE, LI, 0).NumLoops;


  // Only makes sense when we tracked errors.

  if (PollyTrackFailures)

    emitMissedRemarks(F);


  if (ReportLevel)

    printLocations(F);


  assert(ValidRegions.size() <= DetectionContextMap.size() &&

         "Cached more results than valid regions");

}


template <class RR, typename... Args>

inline bool ScopDetection::invalid(DetectionContext &Context, bool Assert,

                                   Args &&...Arguments) const {

  if (!Context.Verifying) {

    RejectLog &Log = Context.Log;

    std::shared_ptr<RR> RejectReason = std::make_shared<RR>(Arguments...);

    Context.IsInvalid = true;


    // Log even if PollyTrackFailures is false, the log entries are also used in

    // canUseISLTripCount().

    Log.report(RejectReason);


    POLLY_DEBUG(dbgs() << RejectReason->getMessage());

    POLLY_DEBUG(dbgs() << "\n");

  } else {

    assert(!Assert && "Verification of detected scop failed");

  }


  return false;

}


bool ScopDetection::isMaxRegionInScop(const Region &R, bool Verify) {

  if (!ValidRegions.count(&R))

    return false;


  if (Verify) {

    BBPair P = getBBPairForRegion(&R);

    std::unique_ptr<DetectionContext> &Entry = DetectionContextMap[P];


    // Free previous DetectionContext for the region and create and verify a new

    // one. Be sure that the DetectionContext is not still used by a ScopInfop.

    // Due to changes but CodeGeneration of another Scop, the Region object and

    // the BBPair might not match anymore.

    Entry = std::make_unique<DetectionContext>(const_cast<Region &>(R), AA,

                                               /*Verifying=*/false);


    return isValidRegion(*Entry.get());

  }


  return true;

}


std::string ScopDetection::regionIsInvalidBecause(const Region *R) const {

  // Get the first error we found. Even in keep-going mode, this is the first

  // reason that caused the candidate to be rejected.

  auto *Log = lookupRejectionLog(R);


  // This can happen when we marked a region invalid, but didn't track

  // an error for it.

  if (!Log || !Log->hasErrors())

    return "";


  RejectReasonPtr RR = *Log->begin();

  return RR->getMessage();

}


bool ScopDetection::addOverApproximatedRegion(Region *AR,

                                              DetectionContext &Context) const {

  // If we already know about Ar we can exit.

  if (!Context.NonAffineSubRegionSet.insert(AR))

    return true;


  // All loops in the region have to be overapproximated too if there

  // are accesses that depend on the iteration count.


  for (BasicBlock *BB : AR->blocks()) {

    Loop *L = LI.getLoopFor(BB);

    if (AR->contains(L))

      Context.BoxedLoopsSet.insert(L);

  }


  return (AllowNonAffineSubLoops || Context.BoxedLoopsSet.empty());

}


bool ScopDetection::onlyValidRequiredInvariantLoads(

    InvariantLoadsSetTy &RequiredILS, DetectionContext &Context) const {

  Region &CurRegion = Context.CurRegion;

  const DataLayout &DL = CurRegion.getEntry()->getModule()->getDataLayout();


  if (!PollyInvariantLoadHoisting && !RequiredILS.empty())

    return false;


  for (LoadInst *Load : RequiredILS) {

    // If we already know a load has been accepted as required invariant, we

    // already run the validation below once and consequently don't need to

    // run it again. Hence, we return early. For certain test cases (e.g.,

    // COSMO this avoids us spending 50% of scop-detection time in this

    // very function (and its children).

    if (Context.RequiredILS.count(Load))

      continue;

    if (!isHoistableLoad(Load, CurRegion, LI, SE, DT, Context.RequiredILS))

      return false;


    for (auto NonAffineRegion : Context.NonAffineSubRegionSet) {

      if (isSafeToLoadUnconditionally(Load->getPointerOperand(),

                                      Load->getType(), Load->getAlign(), DL,

                                      nullptr))

        continue;


      if (NonAffineRegion->contains(Load) &&

          Load->getParent() != NonAffineRegion->getEntry())

        return false;

    }

  }


  Context.RequiredILS.insert(RequiredILS.begin(), RequiredILS.end());


  return true;

}


bool ScopDetection::involvesMultiplePtrs(const SCEV *S0, const SCEV *S1,

                                         Loop *Scope) const {

  SetVector<Value *> Values;

  findValues(S0, SE, Values);

  if (S1)

    findValues(S1, SE, Values);


  SmallPtrSet<Value *, 8> PtrVals;

  for (auto *V : Values) {

    if (auto *P2I = dyn_cast<PtrToIntInst>(V))

      V = P2I->getOperand(0);


    if (!V->getType()->isPointerTy())

      continue;


    const SCEV *PtrSCEV = SE.getSCEVAtScope(V, Scope);

    if (isa<SCEVConstant>(PtrSCEV))

      continue;


    auto *BasePtr = dyn_cast<SCEVUnknown>(SE.getPointerBase(PtrSCEV));

    if (!BasePtr)

      return true;


    Value *BasePtrVal = BasePtr->getValue();

    if (PtrVals.insert(BasePtrVal).second) {

      for (auto *PtrVal : PtrVals)

        if (PtrVal != BasePtrVal && !AA.isNoAlias(PtrVal, BasePtrVal))

          return true;

    }

  }


  return false;

}


bool ScopDetection::isAffine(const SCEV *S, Loop *Scope,

                             DetectionContext &Context) const {

  InvariantLoadsSetTy AccessILS;

  if (!isAffineExpr(&Context.CurRegion, Scope, S, SE, &AccessILS))

    return false;


  if (!onlyValidRequiredInvariantLoads(AccessILS, Context))

    return false;


  return true;

}


bool ScopDetection::isValidSwitch(BasicBlock &BB, SwitchInst *SI,

                                  Value *Condition, bool IsLoopBranch,

                                  DetectionContext &Context) const {

  Loop *L = LI.getLoopFor(&BB);

  const SCEV *ConditionSCEV = SE.getSCEVAtScope(Condition, L);


  if (IsLoopBranch && L->isLoopLatch(&BB))

    return false;


  // Check for invalid usage of different pointers in one expression.

  if (involvesMultiplePtrs(ConditionSCEV, nullptr, L))

    return false;


  if (isAffine(ConditionSCEV, L, Context))

    return true;


  if (AllowNonAffineSubRegions &&

      addOverApproximatedRegion(RI.getRegionFor(&BB), Context))

    return true;


  return invalid<ReportNonAffBranch>(Context, /*Assert=*/true, &BB,

                                     ConditionSCEV, ConditionSCEV, SI);

}


bool ScopDetection::isValidBranch(BasicBlock &BB, BranchInst *BI,

                                  Value *Condition, bool IsLoopBranch,

                                  DetectionContext &Context) {

  // Constant integer conditions are always affine.

  if (isa<ConstantInt>(Condition))

    return true;


  if (BinaryOperator *BinOp = dyn_cast<BinaryOperator>(Condition)) {

    auto Opcode = BinOp->getOpcode();

    if (Opcode == Instruction::And || Opcode == Instruction::Or) {

      Value *Op0 = BinOp->getOperand(0);

      Value *Op1 = BinOp->getOperand(1);

      return isValidBranch(BB, BI, Op0, IsLoopBranch, Context) &&

             isValidBranch(BB, BI, Op1, IsLoopBranch, Context);

    }

  }


  if (auto PHI = dyn_cast<PHINode>(Condition)) {

    auto *Unique = dyn_cast_or_null<ConstantInt>(

        getUniqueNonErrorValue(PHI, &Context.CurRegion, this));

    if (Unique && (Unique->isZero() || Unique->isOne()))

      return true;

  }


  if (auto Load = dyn_cast<LoadInst>(Condition))

    if (!IsLoopBranch && Context.CurRegion.contains(Load)) {

      Context.RequiredILS.insert(Load);

      return true;

    }


  // Non constant conditions of branches need to be ICmpInst.

  if (!isa<ICmpInst>(Condition)) {

    if (!IsLoopBranch && AllowNonAffineSubRegions &&

        addOverApproximatedRegion(RI.getRegionFor(&BB), Context))

      return true;

    return invalid<ReportInvalidCond>(Context, /*Assert=*/true, BI, &BB);

  }


  ICmpInst *ICmp = cast<ICmpInst>(Condition);


  // Are both operands of the ICmp affine?

  if (isa<UndefValue>(ICmp->getOperand(0)) ||

      isa<UndefValue>(ICmp->getOperand(1)))

    return invalid<ReportUndefOperand>(Context, /*Assert=*/true, &BB, ICmp);


  Loop *L = LI.getLoopFor(&BB);

  const SCEV *LHS = SE.getSCEVAtScope(ICmp->getOperand(0), L);

  const SCEV *RHS = SE.getSCEVAtScope(ICmp->getOperand(1), L);


  LHS = tryForwardThroughPHI(LHS, Context.CurRegion, SE, this);

  RHS = tryForwardThroughPHI(RHS, Context.CurRegion, SE, this);


  // If unsigned operations are not allowed try to approximate the region.

  if (ICmp->isUnsigned() && !PollyAllowUnsignedOperations)

    return !IsLoopBranch && AllowNonAffineSubRegions &&

           addOverApproximatedRegion(RI.getRegionFor(&BB), Context);


  // Check for invalid usage of different pointers in one expression.

  if (ICmp->isEquality() && involvesMultiplePtrs(LHS, nullptr, L) &&

      involvesMultiplePtrs(RHS, nullptr, L))

    return false;


  // Check for invalid usage of different pointers in a relational comparison.

  if (ICmp->isRelational() && involvesMultiplePtrs(LHS, RHS, L))

    return false;


  if (isAffine(LHS, L, Context) && isAffine(RHS, L, Context))

    return true;


  if (!IsLoopBranch && AllowNonAffineSubRegions &&

      addOverApproximatedRegion(RI.getRegionFor(&BB), Context))

    return true;


  if (IsLoopBranch)

    return false;


  return invalid<ReportNonAffBranch>(Context, /*Assert=*/true, &BB, LHS, RHS,

                                     ICmp);

}


bool ScopDetection::isValidCFG(BasicBlock &BB, bool IsLoopBranch,

                               bool AllowUnreachable,

                               DetectionContext &Context) {

  Region &CurRegion = Context.CurRegion;


  Instruction *TI = BB.getTerminator();


  if (AllowUnreachable && isa<UnreachableInst>(TI))

    return true;


  // Return instructions are only valid if the region is the top level region.

  if (isa<ReturnInst>(TI) && CurRegion.isTopLevelRegion())

    return true;


  Value *Condition = getConditionFromTerminator(TI);


  if (!Condition)

    return invalid<ReportInvalidTerminator>(Context, /*Assert=*/true, &BB);


  // UndefValue is not allowed as condition.

  if (isa<UndefValue>(Condition))

    return invalid<ReportUndefCond>(Context, /*Assert=*/true, TI, &BB);


  if (BranchInst *BI = dyn_cast<BranchInst>(TI))

    return isValidBranch(BB, BI, Condition, IsLoopBranch, Context);


  SwitchInst *SI = dyn_cast<SwitchInst>(TI);

  assert(SI && "Terminator was neither branch nor switch");


  return isValidSwitch(BB, SI, Condition, IsLoopBranch, Context);

}


bool ScopDetection::isValidCallInst(CallInst &CI,

                                    DetectionContext &Context) const {

  if (CI.doesNotReturn())

    return false;


  if (CI.doesNotAccessMemory())

    return true;


  if (auto *II = dyn_cast<IntrinsicInst>(&CI))

    if (isValidIntrinsicInst(*II, Context))

      return true;


  Function *CalledFunction = CI.getCalledFunction();


  // Indirect calls are not supported.

  if (CalledFunction == nullptr)

    return false;


  if (isDebugCall(&CI)) {

    POLLY_DEBUG(dbgs() << "Allow call to debug function: "

                       << CalledFunction->getName() << '\n');

    return true;

  }


  if (AllowModrefCall) {

    MemoryEffects ME = AA.getMemoryEffects(CalledFunction);

    if (ME.onlyAccessesArgPointees()) {

      for (const auto &Arg : CI.args()) {

        if (!Arg->getType()->isPointerTy())

          continue;


        // Bail if a pointer argument has a base address not known to

        // ScalarEvolution. Note that a zero pointer is acceptable.

        const SCEV *ArgSCEV =

            SE.getSCEVAtScope(Arg, LI.getLoopFor(CI.getParent()));

        if (ArgSCEV->isZero())

          continue;


        auto *BP = dyn_cast<SCEVUnknown>(SE.getPointerBase(ArgSCEV));

        if (!BP)

          return false;


        // Implicitly disable delinearization since we have an unknown

        // accesses with an unknown access function.

        Context.HasUnknownAccess = true;

      }


      // Explicitly use addUnknown so we don't put a loop-variant

      // pointer into the alias set.

      Context.AST.addUnknown(&CI);

      return true;

    }


    if (ME.onlyReadsMemory()) {

      // Implicitly disable delinearization since we have an unknown

      // accesses with an unknown access function.

      Context.HasUnknownAccess = true;

      // Explicitly use addUnknown so we don't put a loop-variant

      // pointer into the alias set.

      Context.AST.addUnknown(&CI);

      return true;

    }

    return false;

  }


  return false;

}


bool ScopDetection::isValidIntrinsicInst(IntrinsicInst &II,

                                         DetectionContext &Context) const {

  if (isIgnoredIntrinsic(&II))

    return true;


  // The closest loop surrounding the call instruction.

  Loop *L = LI.getLoopFor(II.getParent());


  // The access function and base pointer for memory intrinsics.

  const SCEV *AF;

  const SCEVUnknown *BP;


  switch (II.getIntrinsicID()) {

  // Memory intrinsics that can be represented are supported.

  case Intrinsic::memmove:

  case Intrinsic::memcpy:

    AF = SE.getSCEVAtScope(cast<MemTransferInst>(II).getSource(), L);

    if (!AF->isZero()) {

      BP = dyn_cast<SCEVUnknown>(SE.getPointerBase(AF));

      // Bail if the source pointer is not valid.

      if (!isValidAccess(&II, AF, BP, Context))

        return false;

    }

    [[fallthrough]];

  case Intrinsic::memset:

    AF = SE.getSCEVAtScope(cast<MemIntrinsic>(II).getDest(), L);

    if (!AF->isZero()) {

      BP = dyn_cast<SCEVUnknown>(SE.getPointerBase(AF));

      // Bail if the destination pointer is not valid.

      if (!isValidAccess(&II, AF, BP, Context))

        return false;

    }


    // Bail if the length is not affine.

    if (!isAffine(SE.getSCEVAtScope(cast<MemIntrinsic>(II).getLength(), L), L,

                  Context))

      return false;


    return true;

  default:

    break;

  }


  return false;

}


bool ScopDetection::isInvariant(Value &Val, const Region &Reg,

                                DetectionContext &Ctx) const {

  // A reference to function argument or constant value is invariant.

  if (isa<Argument>(Val) || isa<Constant>(Val))

    return true;


  Instruction *I = dyn_cast<Instruction>(&Val);

  if (!I)

    return false;


  if (!Reg.contains(I))

    return true;


  // Loads within the SCoP may read arbitrary values, need to hoist them. If it

  // is not hoistable, it will be rejected later, but here we assume it is and

  // that makes the value invariant.

  if (auto LI = dyn_cast<LoadInst>(I)) {

    Ctx.RequiredILS.insert(LI);

    return true;

  }


  return false;

}


namespace {


/// Remove smax of smax(0, size) expressions from a SCEV expression and

/// register the '...' components.

///

/// Array access expressions as they are generated by GFortran contain smax(0,

/// size) expressions that confuse the 'normal' delinearization algorithm.

/// However, if we extract such expressions before the normal delinearization

/// takes place they can actually help to identify array size expressions in

/// Fortran accesses. For the subsequently following delinearization the smax(0,

/// size) component can be replaced by just 'size'. This is correct as we will

/// always add and verify the assumption that for all subscript expressions

/// 'exp' the inequality 0 <= exp < size holds. Hence, we will also verify

/// that 0 <= size, which means smax(0, size) == size.

class SCEVRemoveMax final : public SCEVRewriteVisitor<SCEVRemoveMax> {

public:

  SCEVRemoveMax(ScalarEvolution &SE, std::vector<const SCEV *> *Terms)

      : SCEVRewriteVisitor(SE), Terms(Terms) {}


  static const SCEV *rewrite(const SCEV *Scev, ScalarEvolution &SE,

                             std::vector<const SCEV *> *Terms = nullptr) {

    SCEVRemoveMax Rewriter(SE, Terms);

    return Rewriter.visit(Scev);

  }


  const SCEV *visitSMaxExpr(const SCEVSMaxExpr *Expr) {

    if ((Expr->getNumOperands() == 2) && Expr->getOperand(0)->isZero()) {

      auto Res = visit(Expr->getOperand(1));

      if (Terms)

        (*Terms).push_back(Res);

      return Res;

    }


    return Expr;

  }


private:

  std::vector<const SCEV *> *Terms;

};

} // namespace


SmallVector<const SCEV *, 4>

ScopDetection::getDelinearizationTerms(DetectionContext &Context,

                                       const SCEVUnknown *BasePointer) const {

  SmallVector<const SCEV *, 4> Terms;

  for (const auto &Pair : Context.Accesses[BasePointer]) {

    std::vector<const SCEV *> MaxTerms;

    SCEVRemoveMax::rewrite(Pair.second, SE, &MaxTerms);

    if (!MaxTerms.empty()) {

      Terms.insert(Terms.begin(), MaxTerms.begin(), MaxTerms.end());

      continue;

    }

    // In case the outermost expression is a plain add, we check if any of its

    // terms has the form 4 * %inst * %param * %param ..., aka a term that

    // contains a product between a parameter and an instruction that is

    // inside the scop. Such instructions, if allowed at all, are instructions

    // SCEV can not represent, but Polly is still looking through. As a

    // result, these instructions can depend on induction variables and are

    // most likely no array sizes. However, terms that are multiplied with

    // them are likely candidates for array sizes.

    if (auto *AF = dyn_cast<SCEVAddExpr>(Pair.second)) {

      for (auto Op : AF->operands()) {

        if (auto *AF2 = dyn_cast<SCEVAddRecExpr>(Op))

          collectParametricTerms(SE, AF2, Terms);

        if (auto *AF2 = dyn_cast<SCEVMulExpr>(Op)) {

          SmallVector<const SCEV *, 0> Operands;


          for (const SCEV *MulOp : AF2->operands()) {

            if (auto *Const = dyn_cast<SCEVConstant>(MulOp))

              Operands.push_back(Const);

            if (auto *Unknown = dyn_cast<SCEVUnknown>(MulOp)) {

              if (auto *Inst = dyn_cast<Instruction>(Unknown->getValue())) {

                if (!Context.CurRegion.contains(Inst))

                  Operands.push_back(MulOp);


              } else {

                Operands.push_back(MulOp);

              }

            }

          }

          if (Operands.size())

            Terms.push_back(SE.getMulExpr(Operands));

        }

      }

    }

    if (Terms.empty())

      collectParametricTerms(SE, Pair.second, Terms);

  }

  return Terms;

}


bool ScopDetection::hasValidArraySizes(DetectionContext &Context,

                                       SmallVectorImpl<const SCEV *> &Sizes,

                                       const SCEVUnknown *BasePointer,

                                       Loop *Scope) const {

  // If no sizes were found, all sizes are trivially valid. We allow this case

  // to make it possible to pass known-affine accesses to the delinearization to

  // try to recover some interesting multi-dimensional accesses, but to still

  // allow the already known to be affine access in case the delinearization

  // fails. In such situations, the delinearization will just return a Sizes

  // array of size zero.

  if (Sizes.size() == 0)

    return true;


  Value *BaseValue = BasePointer->getValue();

  Region &CurRegion = Context.CurRegion;

  for (const SCEV *DelinearizedSize : Sizes) {

    // Don't pass down the scope to isAfffine; array dimensions must be

    // invariant across the entire scop.

    if (!isAffine(DelinearizedSize, nullptr, Context)) {

      Sizes.clear();

      break;

    }

    if (auto *Unknown = dyn_cast<SCEVUnknown>(DelinearizedSize)) {

      auto *V = dyn_cast<Value>(Unknown->getValue());

      if (auto *Load = dyn_cast<LoadInst>(V)) {

        if (Context.CurRegion.contains(Load) &&

            isHoistableLoad(Load, CurRegion, LI, SE, DT, Context.RequiredILS))

          Context.RequiredILS.insert(Load);

        continue;

      }

    }

    if (hasScalarDepsInsideRegion(DelinearizedSize, &CurRegion, Scope, false,

                                  Context.RequiredILS))

      return invalid<ReportNonAffineAccess>(

          Context, /*Assert=*/true, DelinearizedSize,

          Context.Accesses[BasePointer].front().first, BaseValue);

  }


  // No array shape derived.

  if (Sizes.empty()) {

    if (AllowNonAffine)

      return true;


    for (const auto &Pair : Context.Accesses[BasePointer]) {

      const Instruction *Insn = Pair.first;

      const SCEV *AF = Pair.second;


      if (!isAffine(AF, Scope, Context)) {

        invalid<ReportNonAffineAccess>(Context, /*Assert=*/true, AF, Insn,

                                       BaseValue);

        if (!KeepGoing)

          return false;

      }

    }

    return false;

  }

  return true;

}


// We first store the resulting memory accesses in TempMemoryAccesses. Only

// if the access functions for all memory accesses have been successfully

// delinearized we continue. Otherwise, we either report a failure or, if

// non-affine accesses are allowed, we drop the information. In case the

// information is dropped the memory accesses need to be overapproximated

// when translated to a polyhedral representation.

bool ScopDetection::computeAccessFunctions(

    DetectionContext &Context, const SCEVUnknown *BasePointer,

    std::shared_ptr<ArrayShape> Shape) const {

  Value *BaseValue = BasePointer->getValue();

  bool BasePtrHasNonAffine = false;

  MapInsnToMemAcc TempMemoryAccesses;

  for (const auto &Pair : Context.Accesses[BasePointer]) {

    const Instruction *Insn = Pair.first;

    auto *AF = Pair.second;

    AF = SCEVRemoveMax::rewrite(AF, SE);

    bool IsNonAffine = false;

    TempMemoryAccesses.insert(std::make_pair(Insn, MemAcc(Insn, Shape)));

    MemAcc *Acc = &TempMemoryAccesses.find(Insn)->second;

    auto *Scope = LI.getLoopFor(Insn->getParent());


    if (!AF) {

      if (isAffine(Pair.second, Scope, Context))

        Acc->DelinearizedSubscripts.push_back(Pair.second);

      else

        IsNonAffine = true;

    } else {

      if (Shape->DelinearizedSizes.size() == 0) {

        Acc->DelinearizedSubscripts.push_back(AF);

      } else {

        llvm::computeAccessFunctions(SE, AF, Acc->DelinearizedSubscripts,

                                     Shape->DelinearizedSizes);

        if (Acc->DelinearizedSubscripts.size() == 0)

          IsNonAffine = true;

      }

      for (const SCEV *S : Acc->DelinearizedSubscripts)

        if (!isAffine(S, Scope, Context))

          IsNonAffine = true;

    }


    // (Possibly) report non affine access

    if (IsNonAffine) {

      BasePtrHasNonAffine = true;

      if (!AllowNonAffine) {

        invalid<ReportNonAffineAccess>(Context, /*Assert=*/true, Pair.second,

                                       Insn, BaseValue);

        if (!KeepGoing)

          return false;

      }

    }

  }


  if (!BasePtrHasNonAffine)

    Context.InsnToMemAcc.insert(TempMemoryAccesses.begin(),

                                TempMemoryAccesses.end());


  return true;

}


bool ScopDetection::hasBaseAffineAccesses(DetectionContext &Context,

                                          const SCEVUnknown *BasePointer,

                                          Loop *Scope) const {

  auto Shape = std::shared_ptr<ArrayShape>(new ArrayShape(BasePointer));


  auto Terms = getDelinearizationTerms(Context, BasePointer);


  findArrayDimensions(SE, Terms, Shape->DelinearizedSizes,

                      Context.ElementSize[BasePointer]);


  if (!hasValidArraySizes(Context, Shape->DelinearizedSizes, BasePointer,

                          Scope))

    return false;


  return computeAccessFunctions(Context, BasePointer, Shape);

}


bool ScopDetection::hasAffineMemoryAccesses(DetectionContext &Context) const {

  // TODO: If we have an unknown access and other non-affine accesses we do

  //       not try to delinearize them for now.

  if (Context.HasUnknownAccess && !Context.NonAffineAccesses.empty())

    return AllowNonAffine;


  for (auto &Pair : Context.NonAffineAccesses) {

    auto *BasePointer = Pair.first;

    auto *Scope = Pair.second;

    if (!hasBaseAffineAccesses(Context, BasePointer, Scope)) {

      Context.IsInvalid = true;

      if (!KeepGoing)

        return false;

    }

  }

  return true;

}


bool ScopDetection::isValidAccess(Instruction *Inst, const SCEV *AF,

                                  const SCEVUnknown *BP,

                                  DetectionContext &Context) const {


  if (!BP)

    return invalid<ReportNoBasePtr>(Context, /*Assert=*/true, Inst);


  auto *BV = BP->getValue();

  if (isa<UndefValue>(BV))

    return invalid<ReportUndefBasePtr>(Context, /*Assert=*/true, Inst);


  // FIXME: Think about allowing IntToPtrInst

  if (IntToPtrInst *Inst = dyn_cast<IntToPtrInst>(BV))

    return invalid<ReportIntToPtr>(Context, /*Assert=*/true, Inst);


  // Check that the base address of the access is invariant in the current

  // region.

  if (!isInvariant(*BV, Context.CurRegion, Context))

    return invalid<ReportVariantBasePtr>(Context, /*Assert=*/true, BV, Inst);


  AF = SE.getMinusSCEV(AF, BP);


  const SCEV *Size;

  if (!isa<MemIntrinsic>(Inst)) {

    Size = SE.getElementSize(Inst);

  } else {

    auto *SizeTy =

        SE.getEffectiveSCEVType(PointerType::getUnqual(SE.getContext()));

    Size = SE.getConstant(SizeTy, 8);

  }


  if (Context.ElementSize[BP]) {

    if (!AllowDifferentTypes && Context.ElementSize[BP] != Size)

      return invalid<ReportDifferentArrayElementSize>(Context, /*Assert=*/true,

                                                      Inst, BV);


    Context.ElementSize[BP] = SE.getSMinExpr(Size, Context.ElementSize[BP]);

  } else {

    Context.ElementSize[BP] = Size;

  }


  bool IsVariantInNonAffineLoop = false;

  SetVector<const Loop *> Loops;

  findLoops(AF, Loops);

  for (const Loop *L : Loops)

    if (Context.BoxedLoopsSet.count(L))

      IsVariantInNonAffineLoop = true;


  auto *Scope = LI.getLoopFor(Inst->getParent());

  bool IsAffine = !IsVariantInNonAffineLoop && isAffine(AF, Scope, Context);

  // Do not try to delinearize memory intrinsics and force them to be affine.

  if (isa<MemIntrinsic>(Inst) && !IsAffine) {

    return invalid<ReportNonAffineAccess>(Context, /*Assert=*/true, AF, Inst,

                                          BV);

  } else if (PollyDelinearize && !IsVariantInNonAffineLoop) {

    Context.Accesses[BP].push_back({Inst, AF});


    if (!IsAffine)

      Context.NonAffineAccesses.insert(

          std::make_pair(BP, LI.getLoopFor(Inst->getParent())));

  } else if (!AllowNonAffine && !IsAffine) {

    return invalid<ReportNonAffineAccess>(Context, /*Assert=*/true, AF, Inst,

                                          BV);

  }


  if (IgnoreAliasing)

    return true;


  // Check if the base pointer of the memory access does alias with

  // any other pointer. This cannot be handled at the moment.

  AAMDNodes AATags = Inst->getAAMetadata();

  AliasSet &AS = Context.AST.getAliasSetFor(

      MemoryLocation::getBeforeOrAfter(BP->getValue(), AATags));


  if (!AS.isMustAlias()) {

    if (PollyUseRuntimeAliasChecks) {

      bool CanBuildRunTimeCheck = true;

      // The run-time alias check places code that involves the base pointer at

      // the beginning of the SCoP. This breaks if the base pointer is defined

      // inside the scop. Hence, we can only create a run-time check if we are

      // sure the base pointer is not an instruction defined inside the scop.

      // However, we can ignore loads that will be hoisted.


      auto ASPointers = AS.getPointers();


      InvariantLoadsSetTy VariantLS, InvariantLS;

      // In order to detect loads which are dependent on other invariant loads

      // as invariant, we use fixed-point iteration method here i.e we iterate

      // over the alias set for arbitrary number of times until it is safe to

      // assume that all the invariant loads have been detected

      while (true) {

        const unsigned int VariantSize = VariantLS.size(),

                           InvariantSize = InvariantLS.size();


        for (const Value *Ptr : ASPointers) {

          Instruction *Inst = dyn_cast<Instruction>(const_cast<Value *>(Ptr));

          if (Inst && Context.CurRegion.contains(Inst)) {

            auto *Load = dyn_cast<LoadInst>(Inst);

            if (Load && InvariantLS.count(Load))

              continue;

            if (Load && isHoistableLoad(Load, Context.CurRegion, LI, SE, DT,

                                        InvariantLS)) {

              if (VariantLS.count(Load))

                VariantLS.remove(Load);

              Context.RequiredILS.insert(Load);

              InvariantLS.insert(Load);

            } else {

              CanBuildRunTimeCheck = false;

              VariantLS.insert(Load);

            }

          }

        }


        if (InvariantSize == InvariantLS.size() &&

            VariantSize == VariantLS.size())

          break;

      }


      if (CanBuildRunTimeCheck)

        return true;

    }

    return invalid<ReportAlias>(Context, /*Assert=*/true, Inst, AS);

  }


  return true;

}


bool ScopDetection::isValidMemoryAccess(MemAccInst Inst,

                                        DetectionContext &Context) const {

  Value *Ptr = Inst.getPointerOperand();

  Loop *L = LI.getLoopFor(Inst->getParent());

  const SCEV *AccessFunction = SE.getSCEVAtScope(Ptr, L);

  const SCEVUnknown *BasePointer;


  BasePointer = dyn_cast<SCEVUnknown>(SE.getPointerBase(AccessFunction));


  return isValidAccess(Inst, AccessFunction, BasePointer, Context);

}


bool ScopDetection::isValidInstruction(Instruction &Inst,

                                       DetectionContext &Context) {

  for (auto &Op : Inst.operands()) {

    auto *OpInst = dyn_cast<Instruction>(&Op);


    if (!OpInst)

      continue;


    if (isErrorBlock(*OpInst->getParent(), Context.CurRegion)) {

      auto *PHI = dyn_cast<PHINode>(OpInst);

      if (PHI) {

        for (User *U : PHI->users()) {

          auto *UI = dyn_cast<Instruction>(U);

          if (!UI || !UI->isTerminator())

            return false;

        }

      } else {

        return false;

      }

    }

  }


  if (isa<LandingPadInst>(&Inst) || isa<ResumeInst>(&Inst))

    return false;


  // We only check the call instruction but not invoke instruction.

  if (CallInst *CI = dyn_cast<CallInst>(&Inst)) {

    if (isValidCallInst(*CI, Context))

      return true;


    return invalid<ReportFuncCall>(Context, /*Assert=*/true, &Inst);

  }


  if (!Inst.mayReadOrWriteMemory()) {

    if (!isa<AllocaInst>(Inst))

      return true;


    return invalid<ReportAlloca>(Context, /*Assert=*/true, &Inst);

  }


  // Check the access function.

  if (auto MemInst = MemAccInst::dyn_cast(Inst)) {

    Context.hasStores |= isa<StoreInst>(MemInst);

    Context.hasLoads |= isa<LoadInst>(MemInst);

    if (!MemInst.isSimple())

      return invalid<ReportNonSimpleMemoryAccess>(Context, /*Assert=*/true,

                                                  &Inst);


    return isValidMemoryAccess(MemInst, Context);

  }


  // We do not know this instruction, therefore we assume it is invalid.

  return invalid<ReportUnknownInst>(Context, /*Assert=*/true, &Inst);

}


/// Check whether @p L has exiting blocks.

///

/// @param L The loop of interest

///

/// @return True if the loop has exiting blocks, false otherwise.

static bool hasExitingBlocks(Loop *L) {

  SmallVector<BasicBlock *, 4> ExitingBlocks;

  L->getExitingBlocks(ExitingBlocks);

  return !ExitingBlocks.empty();

}


bool ScopDetection::canUseISLTripCount(Loop *L, DetectionContext &Context) {

  // FIXME: Yes, this is bad. isValidCFG() may call invalid<Reason>() which

  // causes the SCoP to be rejected regardless on whether non-ISL trip counts

  // could be used. We currently preserve the legacy behaviour of rejecting

  // based on Context.Log.size() added by isValidCFG() or before, regardless on

  // whether the ISL trip count can be used or can be used as a non-affine

  // region. However, we allow rejections by isValidCFG() that do not result in

  // an error log entry.

  bool OldIsInvalid = Context.IsInvalid;


  // Ensure the loop has valid exiting blocks as well as latches, otherwise we

  // need to overapproximate it as a boxed loop.

  SmallVector<BasicBlock *, 4> LoopControlBlocks;

  L->getExitingBlocks(LoopControlBlocks);

  L->getLoopLatches(LoopControlBlocks);

  for (BasicBlock *ControlBB : LoopControlBlocks) {

    if (!isValidCFG(*ControlBB, true, false, Context)) {

      Context.IsInvalid = OldIsInvalid || Context.Log.size();

      return false;

    }

  }


  // We can use ISL to compute the trip count of L.

  Context.IsInvalid = OldIsInvalid || Context.Log.size();

  return true;

}


bool ScopDetection::isValidLoop(Loop *L, DetectionContext &Context) {

  // Loops that contain part but not all of the blocks of a region cannot be

  // handled by the schedule generation. Such loop constructs can happen

  // because a region can contain BBs that have no path to the exit block

  // (Infinite loops, UnreachableInst), but such blocks are never part of a

  // loop.

  //

  // _______________

  // | Loop Header | <-----------.

  // ---------------             |

  //        |                    |

  // _______________       ______________

  // | RegionEntry |-----> | RegionExit |----->

  // ---------------       --------------

  //        |

  // _______________

  // | EndlessLoop | <--.

  // ---------------    |

  //       |            |

  //       \------------/

  //

  // In the example above, the loop (LoopHeader,RegionEntry,RegionExit) is

  // neither entirely contained in the region RegionEntry->RegionExit

  // (containing RegionEntry,EndlessLoop) nor is the region entirely contained

  // in the loop.

  // The block EndlessLoop is contained in the region because Region::contains

  // tests whether it is not dominated by RegionExit. This is probably to not

  // having to query the PostdominatorTree. Instead of an endless loop, a dead

  // end can also be formed by an UnreachableInst. This case is already caught

  // by isErrorBlock(). We hence only have to reject endless loops here.

  if (!hasExitingBlocks(L))

    return invalid<ReportLoopHasNoExit>(Context, /*Assert=*/true, L);


  // The algorithm for domain construction assumes that loops has only a single

  // exit block (and hence corresponds to a subregion). Note that we cannot use

  // L->getExitBlock() because it does not check whether all exiting edges point

  // to the same BB.

  SmallVector<BasicBlock *, 4> ExitBlocks;

  L->getExitBlocks(ExitBlocks);

  BasicBlock *TheExitBlock = ExitBlocks[0];

  for (BasicBlock *ExitBB : ExitBlocks) {

    if (TheExitBlock != ExitBB)

      return invalid<ReportLoopHasMultipleExits>(Context, /*Assert=*/true, L);

  }


  if (canUseISLTripCount(L, Context))

    return true;


  if (AllowNonAffineSubLoops && AllowNonAffineSubRegions) {

    Region *R = RI.getRegionFor(L->getHeader());

    while (R != &Context.CurRegion && !R->contains(L))

      R = R->getParent();


    if (addOverApproximatedRegion(R, Context))

      return true;

  }


  const SCEV *LoopCount = SE.getBackedgeTakenCount(L);

  return invalid<ReportLoopBound>(Context, /*Assert=*/true, L, LoopCount);

}


/// Return the number of loops in @p L (incl. @p L) that have a trip

///        count that is not known to be less than @MinProfitableTrips.

ScopDetection::LoopStats

ScopDetection::countBeneficialSubLoops(Loop *L, ScalarEvolution &SE,

                                       unsigned MinProfitableTrips) {

  const SCEV *TripCount = SE.getBackedgeTakenCount(L);


  int NumLoops = 1;

  int MaxLoopDepth = 1;

  if (MinProfitableTrips > 0)

    if (auto *TripCountC = dyn_cast<SCEVConstant>(TripCount))

      if (TripCountC->getType()->getScalarSizeInBits() <= 64)

        if (TripCountC->getValue()->getZExtValue() <= MinProfitableTrips)

          NumLoops -= 1;


  for (auto &SubLoop : *L) {

    LoopStats Stats = countBeneficialSubLoops(SubLoop, SE, MinProfitableTrips);

    NumLoops += Stats.NumLoops;

    MaxLoopDepth = std::max(MaxLoopDepth, Stats.MaxDepth + 1);

  }


  return {NumLoops, MaxLoopDepth};

}


ScopDetection::LoopStats

ScopDetection::countBeneficialLoops(Region *R, ScalarEvolution &SE,

                                    LoopInfo &LI, unsigned MinProfitableTrips) {

  int LoopNum = 0;

  int MaxLoopDepth = 0;


  auto L = LI.getLoopFor(R->getEntry());


  // If L is fully contained in R, move to first loop surrounding R. Otherwise,

  // L is either nullptr or already surrounding R.

  if (L && R->contains(L)) {

    L = R->outermostLoopInRegion(L);

    L = L->getParentLoop();

  }


  auto SubLoops =

      L ? L->getSubLoopsVector() : std::vector<Loop *>(LI.begin(), LI.end());


  for (auto &SubLoop : SubLoops)

    if (R->contains(SubLoop)) {

      LoopStats Stats =

          countBeneficialSubLoops(SubLoop, SE, MinProfitableTrips);

      LoopNum += Stats.NumLoops;

      MaxLoopDepth = std::max(MaxLoopDepth, Stats.MaxDepth);

    }


  return {LoopNum, MaxLoopDepth};

}


static bool isErrorBlockImpl(BasicBlock &BB, const Region &R, LoopInfo &LI,

                             const DominatorTree &DT) {

  if (isa<UnreachableInst>(BB.getTerminator()))

    return true;


  if (LI.isLoopHeader(&BB))

    return false;


  // Don't consider something outside the SCoP as error block. It will precede

  // the code versioning runtime check.

  if (!R.contains(&BB))

    return false;


  // Basic blocks that are always executed are not considered error blocks,

  // as their execution can not be a rare event.

  bool DominatesAllPredecessors = true;

  if (R.isTopLevelRegion()) {

    for (BasicBlock &I : *R.getEntry()->getParent()) {

      if (isa<ReturnInst>(I.getTerminator()) && !DT.dominates(&BB, &I)) {

        DominatesAllPredecessors = false;

        break;

      }

    }

  } else {

    for (auto Pred : predecessors(R.getExit())) {

      if (R.contains(Pred) && !DT.dominates(&BB, Pred)) {

        DominatesAllPredecessors = false;

        break;

      }

    }

  }


  if (DominatesAllPredecessors)

    return false;


  for (Instruction &Inst : BB)

    if (CallInst *CI = dyn_cast<CallInst>(&Inst)) {

      if (isDebugCall(CI))

        continue;


      if (isIgnoredIntrinsic(CI))

        continue;


      // memset, memcpy and memmove are modeled intrinsics.

      if (isa<MemSetInst>(CI) || isa<MemTransferInst>(CI))

        continue;


      if (!CI->doesNotAccessMemory())

        return true;

      if (CI->doesNotReturn())

        return true;

    }


  return false;

}


bool ScopDetection::isErrorBlock(llvm::BasicBlock &BB, const llvm::Region &R) {

  if (!PollyAllowErrorBlocks)

    return false;


  auto It = ErrorBlockCache.insert({std::make_pair(&BB, &R), false});

  if (!It.second)

    return It.first->getSecond();


  bool Result = isErrorBlockImpl(BB, R, LI, DT);

  It.first->second = Result;

  return Result;

}


Region *ScopDetection::expandRegion(Region &R) {

  // Initial no valid region was found (greater than R)

  std::unique_ptr<Region> LastValidRegion;

  auto ExpandedRegion = std::unique_ptr<Region>(R.getExpandedRegion());


  POLLY_DEBUG(dbgs() << "\tExpanding " << R.getNameStr() << "\n");


  while (ExpandedRegion) {

    BBPair P = getBBPairForRegion(ExpandedRegion.get());

    std::unique_ptr<DetectionContext> &Entry = DetectionContextMap[P];

    Entry = std::make_unique<DetectionContext>(*ExpandedRegion, AA,

                                               /*Verifying=*/false);

    DetectionContext &Context = *Entry.get();


    POLLY_DEBUG(dbgs() << "\t\tTrying " << ExpandedRegion->getNameStr()

                       << "\n");

    // Only expand when we did not collect errors.


    if (!Context.Log.hasErrors()) {

      // If the exit is valid check all blocks

      //  - if true, a valid region was found => store it + keep expanding

      //  - if false, .tbd. => stop  (should this really end the loop?)

      if (!allBlocksValid(Context) || Context.Log.hasErrors()) {

        removeCachedResults(*ExpandedRegion);

        DetectionContextMap.erase(P);

        break;

      }


      // Store this region, because it is the greatest valid (encountered so

      // far).

      if (LastValidRegion) {

        removeCachedResults(*LastValidRegion);

        DetectionContextMap.erase(P);

      }

      LastValidRegion = std::move(ExpandedRegion);


      // Create and test the next greater region (if any)

      ExpandedRegion =

          std::unique_ptr<Region>(LastValidRegion->getExpandedRegion());


    } else {

      // Create and test the next greater region (if any)

      removeCachedResults(*ExpandedRegion);

      DetectionContextMap.erase(P);

      ExpandedRegion =

          std::unique_ptr<Region>(ExpandedRegion->getExpandedRegion());

    }

  }


  POLLY_DEBUG({

    if (LastValidRegion)

      dbgs() << "\tto " << LastValidRegion->getNameStr() << "\n";

    else

      dbgs() << "\tExpanding " << R.getNameStr() << " failed\n";

  });


  return LastValidRegion.release();

}


static bool regionWithoutLoops(Region &R, LoopInfo &LI) {

  for (const BasicBlock *BB : R.blocks())

    if (R.contains(LI.getLoopFor(BB)))

      return false;


  return true;

}


void ScopDetection::removeCachedResultsRecursively(const Region &R) {

  for (auto &SubRegion : R) {

    if (ValidRegions.count(SubRegion.get())) {

      removeCachedResults(*SubRegion.get());

    } else

      removeCachedResultsRecursively(*SubRegion);

  }

}


void ScopDetection::removeCachedResults(const Region &R) {

  ValidRegions.remove(&R);

}


void ScopDetection::findScops(Region &R) {

  std::unique_ptr<DetectionContext> &Entry =

      DetectionContextMap[getBBPairForRegion(&R)];

  Entry = std::make_unique<DetectionContext>(R, AA, /*Verifying=*/false);

  DetectionContext &Context = *Entry.get();


  bool DidBailout = true;

  if (!PollyProcessUnprofitable && regionWithoutLoops(R, LI))

    invalid<ReportUnprofitable>(Context, /*Assert=*/true, &R);

  else

    DidBailout = !isValidRegion(Context);


  (void)DidBailout;

  if (KeepGoing) {

    assert((!DidBailout || Context.IsInvalid) &&

           "With -polly-detect-keep-going, it is sufficient that if "

           "isValidRegion short-circuited, that SCoP is invalid");

  } else {

    assert(DidBailout == Context.IsInvalid &&

           "isValidRegion must short-circuit iff the ScoP is invalid");

  }


  if (Context.IsInvalid) {

    removeCachedResults(R);

  } else {

    ValidRegions.insert(&R);

    return;

  }


  for (auto &SubRegion : R)

    findScops(*SubRegion);


  // Try to expand regions.

  //

  // As the region tree normally only contains canonical regions, non canonical

  // regions that form a Scop are not found. Therefore, those non canonical

  // regions are checked by expanding the canonical ones.


  std::vector<Region *> ToExpand;


  for (auto &SubRegion : R)

    ToExpand.push_back(SubRegion.get());


  for (Region *CurrentRegion : ToExpand) {

    // Skip invalid regions. Regions may become invalid, if they are element of

    // an already expanded region.

    if (!ValidRegions.count(CurrentRegion))

      continue;


    // Skip regions that had errors.

    bool HadErrors = lookupRejectionLog(CurrentRegion)->hasErrors();

    if (HadErrors)

      continue;


    Region *ExpandedR = expandRegion(*CurrentRegion);


    if (!ExpandedR)

      continue;


    R.addSubRegion(ExpandedR, true);

    ValidRegions.insert(ExpandedR);

    removeCachedResults(*CurrentRegion);

    removeCachedResultsRecursively(*ExpandedR);

  }

}


bool ScopDetection::allBlocksValid(DetectionContext &Context) {

  Region &CurRegion = Context.CurRegion;


  for (const BasicBlock *BB : CurRegion.blocks()) {

    Loop *L = LI.getLoopFor(BB);

    if (L && L->getHeader() == BB) {

      if (CurRegion.contains(L)) {

        if (!isValidLoop(L, Context)) {

          Context.IsInvalid = true;

          if (!KeepGoing)

            return false;

        }

      } else {

        SmallVector<BasicBlock *, 1> Latches;

        L->getLoopLatches(Latches);

        for (BasicBlock *Latch : Latches)

          if (CurRegion.contains(Latch))

            return invalid<ReportLoopOnlySomeLatches>(Context, /*Assert=*/true,

                                                      L);

      }

    }

  }


  for (BasicBlock *BB : CurRegion.blocks()) {

    bool IsErrorBlock = isErrorBlock(*BB, CurRegion);


    // Also check exception blocks (and possibly register them as non-affine

    // regions). Even though exception blocks are not modeled, we use them

    // to forward-propagate domain constraints during ScopInfo construction.

    if (!isValidCFG(*BB, false, IsErrorBlock, Context) && !KeepGoing)

      return false;


    if (IsErrorBlock)

      continue;


    for (BasicBlock::iterator I = BB->begin(), E = --BB->end(); I != E; ++I)

      if (!isValidInstruction(*I, Context)) {

        Context.IsInvalid = true;

        if (!KeepGoing)

          return false;

      }

  }


  if (!hasAffineMemoryAccesses(Context))

    return false;


  return true;

}


bool ScopDetection::hasSufficientCompute(DetectionContext &Context,

                                         int NumLoops) const {

  int InstCount = 0;


  if (NumLoops == 0)

    return false;


  for (auto *BB : Context.CurRegion.blocks())

    if (Context.CurRegion.contains(LI.getLoopFor(BB)))

      InstCount += BB->size();


  InstCount = InstCount / NumLoops;


  return InstCount >= ProfitabilityMinPerLoopInstructions;

}


bool ScopDetection::hasPossiblyDistributableLoop(

    DetectionContext &Context) const {

  for (auto *BB : Context.CurRegion.blocks()) {

    auto *L = LI.getLoopFor(BB);

    if (!L)

      continue;

    if (!Context.CurRegion.contains(L))

      continue;

    if (Context.BoxedLoopsSet.count(L))

      continue;

    unsigned StmtsWithStoresInLoops = 0;

    for (auto *LBB : L->blocks()) {

      bool MemStore = false;

      for (auto &I : *LBB)

        MemStore |= isa<StoreInst>(&I);

      StmtsWithStoresInLoops += MemStore;

    }

    return (StmtsWithStoresInLoops > 1);

  }

  return false;

}


bool ScopDetection::isProfitableRegion(DetectionContext &Context) const {

  Region &CurRegion = Context.CurRegion;


  if (PollyProcessUnprofitable)

    return true;


  // We can probably not do a lot on scops that only write or only read

  // data.

  if (!Context.hasStores || !Context.hasLoads)

    return invalid<ReportUnprofitable>(Context, /*Assert=*/true, &CurRegion);


  int NumLoops =

      countBeneficialLoops(&CurRegion, SE, LI, MIN_LOOP_TRIP_COUNT).NumLoops;

  int NumAffineLoops = NumLoops - Context.BoxedLoopsSet.size();


  // Scops with at least two loops may allow either loop fusion or tiling and

  // are consequently interesting to look at.

  if (NumAffineLoops >= 2)

    return true;


  // A loop with multiple non-trivial blocks might be amendable to distribution.

  if (NumAffineLoops == 1 && hasPossiblyDistributableLoop(Context))

    return true;


  // Scops that contain a loop with a non-trivial amount of computation per

  // loop-iteration are interesting as we may be able to parallelize such

  // loops. Individual loops that have only a small amount of computation

  // per-iteration are performance-wise very fragile as any change to the

  // loop induction variables may affect performance. To not cause spurious

  // performance regressions, we do not consider such loops.

  if (NumAffineLoops == 1 && hasSufficientCompute(Context, NumLoops))

    return true;


  return invalid<ReportUnprofitable>(Context, /*Assert=*/true, &CurRegion);

}


bool ScopDetection::isValidRegion(DetectionContext &Context) {

  Region &CurRegion = Context.CurRegion;


  POLLY_DEBUG(dbgs() << "Checking region: " << CurRegion.getNameStr()

                     << "\n\t");


  if (!PollyAllowFullFunction && CurRegion.isTopLevelRegion()) {

    POLLY_DEBUG(dbgs() << "Top level region is invalid\n");

    Context.IsInvalid = true;

    return false;

  }


  DebugLoc DbgLoc;

  if (CurRegion.getExit() &&

      isa<UnreachableInst>(CurRegion.getExit()->getTerminator())) {

    POLLY_DEBUG(dbgs() << "Unreachable in exit\n");

    return invalid<ReportUnreachableInExit>(Context, /*Assert=*/true,

                                            CurRegion.getExit(), DbgLoc);

  }


  if (!OnlyRegion.empty() &&

      !CurRegion.getEntry()->getName().count(OnlyRegion)) {

    POLLY_DEBUG({

      dbgs() << "Region entry does not match -polly-only-region";

      dbgs() << "\n";

    });

    Context.IsInvalid = true;

    return false;

  }


  for (BasicBlock *Pred : predecessors(CurRegion.getEntry())) {

    Instruction *PredTerm = Pred->getTerminator();

    if (isa<IndirectBrInst>(PredTerm) || isa<CallBrInst>(PredTerm))

      return invalid<ReportIndirectPredecessor>(

          Context, /*Assert=*/true, PredTerm, PredTerm->getDebugLoc());

  }


  // SCoP cannot contain the entry block of the function, because we need

  // to insert alloca instruction there when translate scalar to array.

  if (!PollyAllowFullFunction &&

      CurRegion.getEntry() ==

          &(CurRegion.getEntry()->getParent()->getEntryBlock()))

    return invalid<ReportEntry>(Context, /*Assert=*/true, CurRegion.getEntry());


  if (!allBlocksValid(Context)) {

    // TODO: Every failure condition within allBlocksValid should call

    // invalid<Reason>(). Otherwise we reject SCoPs without giving feedback to

    // the user.

    Context.IsInvalid = true;

    return false;

  }


  if (!isReducibleRegion(CurRegion, DbgLoc))

    return invalid<ReportIrreducibleRegion>(Context, /*Assert=*/true,

                                            &CurRegion, DbgLoc);


  POLLY_DEBUG(dbgs() << "OK\n");

  return true;

}


void ScopDetection::markFunctionAsInvalid(Function *F) {

  F->addFnAttr(PollySkipFnAttr);

}


bool ScopDetection::isValidFunction(Function &F) {

  return !F.hasFnAttribute(PollySkipFnAttr);

}


void ScopDetection::printLocations(Function &F) {

  for (const Region *R : *this) {

    unsigned LineEntry, LineExit;

    std::string FileName;


    getDebugLocation(R, LineEntry, LineExit, FileName);

    DiagnosticScopFound Diagnostic(F, FileName, LineEntry, LineExit);

    F.getContext().diagnose(Diagnostic);

  }

}


void ScopDetection::emitMissedRemarks(const Function &F) {

  for (auto &DIt : DetectionContextMap) {

    DetectionContext &DC = *DIt.getSecond().get();

    if (DC.Log.hasErrors())

      emitRejectionRemarks(DIt.getFirst(), DC.Log, ORE);

  }

}


bool ScopDetection::isReducibleRegion(Region &R, DebugLoc &DbgLoc) const {

  /// Enum for coloring BBs in Region.

  ///

  /// WHITE - Unvisited BB in DFS walk.

  /// GREY - BBs which are currently on the DFS stack for processing.

  /// BLACK - Visited and completely processed BB.

  enum Color { WHITE, GREY, BLACK };


  BasicBlock *REntry = R.getEntry();

  BasicBlock *RExit = R.getExit();

  // Map to match the color of a BasicBlock during the DFS walk.

  DenseMap<const BasicBlock *, Color> BBColorMap;

  // Stack keeping track of current BB and index of next child to be processed.

  std::stack<std::pair<BasicBlock *, unsigned>> DFSStack;


  unsigned AdjacentBlockIndex = 0;

  BasicBlock *CurrBB, *SuccBB;

  CurrBB = REntry;


  // Initialize the map for all BB with WHITE color.

  for (auto *BB : R.blocks())

    BBColorMap[BB] = WHITE;


  // Process the entry block of the Region.

  BBColorMap[CurrBB] = GREY;

  DFSStack.push(std::make_pair(CurrBB, 0));


  while (!DFSStack.empty()) {

    // Get next BB on stack to be processed.

    CurrBB = DFSStack.top().first;

    AdjacentBlockIndex = DFSStack.top().second;

    DFSStack.pop();


    // Loop to iterate over the successors of current BB.

    const Instruction *TInst = CurrBB->getTerminator();

    unsigned NSucc = TInst->getNumSuccessors();

    for (unsigned I = AdjacentBlockIndex; I < NSucc;

         ++I, ++AdjacentBlockIndex) {

      SuccBB = TInst->getSuccessor(I);


      // Checks for region exit block and self-loops in BB.

      if (SuccBB == RExit || SuccBB == CurrBB)

        continue;


      // WHITE indicates an unvisited BB in DFS walk.

      if (BBColorMap[SuccBB] == WHITE) {

        // Push the current BB and the index of the next child to be visited.

        DFSStack.push(std::make_pair(CurrBB, I + 1));

        // Push the next BB to be processed.

        DFSStack.push(std::make_pair(SuccBB, 0));

        // First time the BB is being processed.

        BBColorMap[SuccBB] = GREY;

        break;

      } else if (BBColorMap[SuccBB] == GREY) {

        // GREY indicates a loop in the control flow.

        // If the destination dominates the source, it is a natural loop

        // else, an irreducible control flow in the region is detected.

        if (!DT.dominates(SuccBB, CurrBB)) {

          // Get debug info of instruction which causes irregular control flow.

          DbgLoc = TInst->getDebugLoc();

          return false;

        }

      }

    }


    // If all children of current BB have been processed,

    // then mark that BB as fully processed.

    if (AdjacentBlockIndex == NSucc)

      BBColorMap[CurrBB] = BLACK;

  }


  return true;

}


static void updateLoopCountStatistic(ScopDetection::LoopStats Stats,

                                     bool OnlyProfitable) {

  if (!OnlyProfitable) {

    NumLoopsInScop += Stats.NumLoops;

    MaxNumLoopsInScop =

        std::max(MaxNumLoopsInScop.getValue(), (uint64_t)Stats.NumLoops);

    if (Stats.MaxDepth == 0)

      NumScopsDepthZero++;

    else if (Stats.MaxDepth == 1)

      NumScopsDepthOne++;

    else if (Stats.MaxDepth == 2)

      NumScopsDepthTwo++;

    else if (Stats.MaxDepth == 3)

      NumScopsDepthThree++;

    else if (Stats.MaxDepth == 4)

      NumScopsDepthFour++;

    else if (Stats.MaxDepth == 5)

      NumScopsDepthFive++;

    else

      NumScopsDepthLarger++;

  } else {

    NumLoopsInProfScop += Stats.NumLoops;

    MaxNumLoopsInProfScop =

        std::max(MaxNumLoopsInProfScop.getValue(), (uint64_t)Stats.NumLoops);

    if (Stats.MaxDepth == 0)

      NumProfScopsDepthZero++;

    else if (Stats.MaxDepth == 1)

      NumProfScopsDepthOne++;

    else if (Stats.MaxDepth == 2)

      NumProfScopsDepthTwo++;

    else if (Stats.MaxDepth == 3)

      NumProfScopsDepthThree++;

    else if (Stats.MaxDepth == 4)

      NumProfScopsDepthFour++;

    else if (Stats.MaxDepth == 5)

      NumProfScopsDepthFive++;

    else

      NumProfScopsDepthLarger++;

  }

}


ScopDetection::DetectionContext *

ScopDetection::getDetectionContext(const Region *R) const {

  auto DCMIt = DetectionContextMap.find(getBBPairForRegion(R));

  if (DCMIt == DetectionContextMap.end())

    return nullptr;

  return DCMIt->second.get();

}


const RejectLog *ScopDetection::lookupRejectionLog(const Region *R) const {

  const DetectionContext *DC = getDetectionContext(R);

  return DC ? &DC->Log : nullptr;

}


void ScopDetection::verifyRegion(const Region &R) {

  assert(isMaxRegionInScop(R) && "Expect R is a valid region.");


  DetectionContext Context(const_cast<Region &>(R), AA, true /*verifying*/);

  isValidRegion(Context);

}


void ScopDetection::verifyAnalysis() {

  if (!VerifyScops)

    return;


  for (const Region *R : ValidRegions)

    verifyRegion(*R);

}


bool ScopDetectionWrapperPass::runOnFunction(Function &F) {

  auto &LI = getAnalysis<LoopInfoWrapperPass>().getLoopInfo();

  auto &RI = getAnalysis<RegionInfoPass>().getRegionInfo();

  auto &AA = getAnalysis<AAResultsWrapperPass>().getAAResults();

  auto &SE = getAnalysis<ScalarEvolutionWrapperPass>().getSE();

  auto &DT = getAnalysis<DominatorTreeWrapperPass>().getDomTree();

  auto &ORE = getAnalysis<OptimizationRemarkEmitterWrapperPass>().getORE();


  Result = std::make_unique<ScopDetection>(DT, SE, LI, RI, AA, ORE);

  Result->detect(F);

  return false;

}


void ScopDetectionWrapperPass::getAnalysisUsage(AnalysisUsage &AU) const {

  AU.addRequired<LoopInfoWrapperPass>();

  AU.addRequiredTransitive<ScalarEvolutionWrapperPass>();

  AU.addRequired<DominatorTreeWrapperPass>();

  AU.addRequired<OptimizationRemarkEmitterWrapperPass>();

  // We also need AA and RegionInfo when we are verifying analysis.

  AU.addRequiredTransitive<AAResultsWrapperPass>();

  AU.addRequiredTransitive<RegionInfoPass>();

  AU.setPreservesAll();

}


void ScopDetectionWrapperPass::print(raw_ostream &OS, const Module *) const {

  for (const Region *R : Result->ValidRegions)

    OS << "Valid Region for Scop: " << R->getNameStr() << '\n';


  OS << "\n";

}


ScopDetectionWrapperPass::ScopDetectionWrapperPass() : FunctionPass(ID) {

  // Disable runtime alias checks if we ignore aliasing all together.

  if (IgnoreAliasing)

    PollyUseRuntimeAliasChecks = false;

}


ScopAnalysis::ScopAnalysis() {

  // Disable runtime alias checks if we ignore aliasing all together.

  if (IgnoreAliasing)

    PollyUseRuntimeAliasChecks = false;

}


void ScopDetectionWrapperPass::releaseMemory() { Result.reset(); }


char ScopDetectionWrapperPass::ID;


AnalysisKey ScopAnalysis::Key;


ScopDetection ScopAnalysis::run(Function &F, FunctionAnalysisManager &FAM) {

  auto &LI = FAM.getResult<LoopAnalysis>(F);

  auto &RI = FAM.getResult<RegionInfoAnalysis>(F);

  auto &AA = FAM.getResult<AAManager>(F);

  auto &SE = FAM.getResult<ScalarEvolutionAnalysis>(F);

  auto &DT = FAM.getResult<DominatorTreeAnalysis>(F);

  auto &ORE = FAM.getResult<OptimizationRemarkEmitterAnalysis>(F);


  ScopDetection Result(DT, SE, LI, RI, AA, ORE);

  Result.detect(F);

  return Result;

}


PreservedAnalyses ScopAnalysisPrinterPass::run(Function &F,

                                               FunctionAnalysisManager &FAM) {

  OS << "Detected Scops in Function " << F.getName() << "\n";

  auto &SD = FAM.getResult<ScopAnalysis>(F);

  for (const Region *R : SD.ValidRegions)

    OS << "Valid Region for Scop: " << R->getNameStr() << '\n';


  OS << "\n";

  return PreservedAnalyses::all();

}


Pass *polly::createScopDetectionWrapperPassPass() {

  return new ScopDetectionWrapperPass();

}


INITIALIZE_PASS_BEGIN(ScopDetectionWrapperPass, "polly-detect",

                      "Polly - Detect static control parts (SCoPs)", false,

                      false);

INITIALIZE_PASS_DEPENDENCY(AAResultsWrapperPass);

INITIALIZE_PASS_DEPENDENCY(LoopInfoWrapperPass);

INITIALIZE_PASS_DEPENDENCY(RegionInfoPass);

INITIALIZE_PASS_DEPENDENCY(DominatorTreeWrapperPass);

INITIALIZE_PASS_DEPENDENCY(ScalarEvolutionWrapperPass);

INITIALIZE_PASS_DEPENDENCY(OptimizationRemarkEmitterWrapperPass);

INITIALIZE_PASS_END(ScopDetectionWrapperPass, "polly-detect",

                    "Polly - Detect static control parts (SCoPs)", false, false)


//===----------------------------------------------------------------------===//


namespace {

/// Print result from ScopDetectionWrapperPass.

class ScopDetectionPrinterLegacyPass final : public FunctionPass {

public:

  static char ID;


  ScopDetectionPrinterLegacyPass() : ScopDetectionPrinterLegacyPass(outs()) {}


  explicit ScopDetectionPrinterLegacyPass(llvm::raw_ostream &OS)

      : FunctionPass(ID), OS(OS) {}


  bool runOnFunction(Function &F) override {

    ScopDetectionWrapperPass &P = getAnalysis<ScopDetectionWrapperPass>();


    OS << "Printing analysis '" << P.getPassName() << "' for function '"

       << F.getName() << "':\n";

    P.print(OS);


    return false;

  }


  void getAnalysisUsage(AnalysisUsage &AU) const override {

    FunctionPass::getAnalysisUsage(AU);

    AU.addRequired<ScopDetectionWrapperPass>();

    AU.setPreservesAll();

  }


private:

  llvm::raw_ostream &OS;

};


char ScopDetectionPrinterLegacyPass::ID = 0;

} // namespace


Pass *polly::createScopDetectionPrinterLegacyPass(raw_ostream &OS) {

  return new ScopDetectionPrinterLegacyPass(OS);

}


INITIALIZE_PASS_BEGIN(ScopDetectionPrinterLegacyPass, "polly-print-detect",

                      "Polly - Print static control parts (SCoPs)", false,

                      false);

INITIALIZE_PASS_DEPENDENCY(ScopDetectionWrapperPass);

INITIALIZE_PASS_END(ScopDetectionPrinterLegacyPass, "polly-print-detect",

                    "Polly - Print static control parts (SCoPs)", false, false)

S1
S1()

Verify
static cl::opt< bool > Verify("polly-codegen-verify", cl::desc("Verify the function generated by Polly"), cl::Hidden, cl::cat(PollyCategory))

INITIALIZE_PASS_BEGIN
INITIALIZE_PASS_BEGIN(DependenceInfo, "polly-dependences", "Polly - Calculate dependences", false, false)

INITIALIZE_PASS_END
INITIALIZE_PASS_END(DependenceInfo, "polly-dependences", "Polly - Calculate dependences", false, false) namespace
Definition: DependenceInfo.cpp:935

INITIALIZE_PASS_DEPENDENCY
INITIALIZE_PASS_DEPENDENCY(ScopInfoRegionPass)

Function
polly dump Polly Dump Function
Definition: DumpFunctionPass.cpp:131

LinkAllPasses.h

Options.h

PollyCategory
llvm::cl::OptionCategory PollyCategory

PollyDebug.h

POLLY_DEBUG
#define POLLY_DEBUG(X)
Definition: PollyDebug.h:23

SCEVValidator.h

ScopDetectionDiagnostic.h

MIN_LOOP_TRIP_COUNT
static const unsigned MIN_LOOP_TRIP_COUNT
The minimal trip count under which loops are considered unprofitable.
Definition: ScopDetection.cpp:232

XPollyProcessUnprofitable
static cl::opt< bool, true > XPollyProcessUnprofitable("polly-process-unprofitable", cl::desc("Process scops that are unlikely to benefit from Polly optimizations."), cl::location(PollyProcessUnprofitable), cl::cat(PollyCategory))

AllowDifferentTypes
static cl::opt< bool > AllowDifferentTypes("polly-allow-differing-element-types", cl::desc("Allow different element types for array accesses"), cl::Hidden, cl::init(true), cl::cat(PollyCategory))

AllowNonAffine
static cl::opt< bool > AllowNonAffine("polly-allow-nonaffine", cl::desc("Allow non affine access functions in arrays"), cl::Hidden, cl::cat(PollyCategory))

STATISTIC
STATISTIC(NumScopRegions, "Number of scops")

OnlyFunctions
static cl::list< std::string > OnlyFunctions("polly-only-func", cl::desc("Only run on functions that match a regex. " "Multiple regexes can be comma separated. " "Scop detection will run on all functions that match " "ANY of the regexes provided."), cl::CommaSeparated, cl::cat(PollyCategory))

VerifyScops
static cl::opt< bool > VerifyScops("polly-detect-verify", cl::desc("Verify the detected SCoPs after each transformation"), cl::Hidden, cl::cat(PollyCategory))

hasExitingBlocks
static bool hasExitingBlocks(Loop *L)
Check whether L has exiting blocks.
Definition: ScopDetection.cpp:1271

OnlyRegion
static cl::opt< std::string > OnlyRegion("polly-only-region", cl::desc("Only run on certain regions (The provided identifier must " "appear in the name of the region's entry block"), cl::value_desc("identifier"), cl::ValueRequired, cl::init(""), cl::cat(PollyCategory))

regionWithoutLoops
static bool regionWithoutLoops(Region &R, LoopInfo &LI)
Definition: ScopDetection.cpp:1546

KeepGoing
static cl::opt< bool > KeepGoing("polly-detect-keep-going", cl::desc("Do not fail on the first error."), cl::Hidden, cl::cat(PollyCategory))

ProfitabilityMinPerLoopInstructions
static cl::opt< int > ProfitabilityMinPerLoopInstructions("polly-detect-profitability-min-per-loop-insts", cl::desc("The minimal number of per-loop instructions before a single loop " "region is considered profitable"), cl::Hidden, cl::ValueRequired, cl::init(100000000), cl::cat(PollyCategory))

TrackFailures
static cl::opt< bool, true > TrackFailures("polly-detect-track-failures", cl::desc("Track failure strings in detecting scop regions"), cl::location(PollyTrackFailures), cl::Hidden, cl::init(true), cl::cat(PollyCategory))

doesStringMatchAnyRegex
static bool doesStringMatchAnyRegex(StringRef Str, const cl::list< std::string > &RegexList)
Check if a string matches any regex in a list of regexes.
Definition: ScopDetection.cpp:321

PollyAllowErrorBlocks
static cl::opt< bool > PollyAllowErrorBlocks("polly-allow-error-blocks", cl::desc("Allow to speculate on the execution of 'error blocks'."), cl::Hidden, cl::init(true), cl::cat(PollyCategory))

IgnoredFunctions
static cl::list< std::string > IgnoredFunctions("polly-ignore-func", cl::desc("Ignore functions that match a regex. " "Multiple regexes can be comma separated. " "Scop detection will ignore all functions that match " "ANY of the regexes provided."), cl::CommaSeparated, cl::cat(PollyCategory))

ReportLevel
static cl::opt< bool > ReportLevel("polly-report", cl::desc("Print information about the activities of Polly"), cl::cat(PollyCategory))

isErrorBlockImpl
static bool isErrorBlockImpl(BasicBlock &BB, const Region &R, LoopInfo &LI, const DominatorTree &DT)
Definition: ScopDetection.cpp:1418

PollyDelinearizeX
static cl::opt< bool, true > PollyDelinearizeX("polly-delinearize", cl::desc("Delinearize array access functions"), cl::location(PollyDelinearize), cl::Hidden, cl::init(true), cl::cat(PollyCategory))

XPollyAllowUnsignedOperations
static cl::opt< bool, true > XPollyAllowUnsignedOperations("polly-allow-unsigned-operations", cl::desc("Allow unsigned operations such as comparisons or zero-extends."), cl::location(PollyAllowUnsignedOperations), cl::Hidden, cl::init(true), cl::cat(PollyCategory))

updateLoopCountStatistic
static void updateLoopCountStatistic(ScopDetection::LoopStats Stats, bool OnlyProfitable)
Definition: ScopDetection.cpp:1917

AllowNonAffineSubRegions
static cl::opt< bool > AllowNonAffineSubRegions("polly-allow-nonaffine-branches", cl::desc("Allow non affine conditions for branches"), cl::Hidden, cl::init(true), cl::cat(PollyCategory))

XAllowFullFunction
static cl::opt< bool, true > XAllowFullFunction("polly-detect-full-functions", cl::desc("Allow the detection of full functions"), cl::location(polly::PollyAllowFullFunction), cl::init(false), cl::cat(PollyCategory))

XPollyInvariantLoadHoisting
static cl::opt< bool, true > XPollyInvariantLoadHoisting("polly-invariant-load-hoisting", cl::desc("Hoist invariant loads."), cl::location(PollyInvariantLoadHoisting), cl::Hidden, cl::cat(PollyCategory))

AllowNonAffineSubLoops
static cl::opt< bool > AllowNonAffineSubLoops("polly-allow-nonaffine-loops", cl::desc("Allow non affine conditions for loops"), cl::Hidden, cl::cat(PollyCategory))

XPollyUseRuntimeAliasChecks
static cl::opt< bool, true > XPollyUseRuntimeAliasChecks("polly-use-runtime-alias-checks", cl::desc("Use runtime alias checks to resolve possible aliasing."), cl::location(PollyUseRuntimeAliasChecks), cl::Hidden, cl::init(true), cl::cat(PollyCategory))

IgnoreAliasing
static cl::opt< bool > IgnoreAliasing("polly-ignore-aliasing", cl::desc("Ignore possible aliasing of the array bases"), cl::Hidden, cl::cat(PollyCategory))

AllowModrefCall
static cl::opt< bool > AllowModrefCall("polly-allow-modref-calls", cl::desc("Allow functions with known modref behavior"), cl::Hidden, cl::cat(PollyCategory))

ScopDetection.h

ScopHelper.h

ScopLocation.h

polly::MemAccInst
Utility proxy to wrap the common members of LoadInst and StoreInst.
Definition: ScopHelper.h:140

polly::MemAccInst::dyn_cast
static MemAccInst dyn_cast(llvm::Value &V)
Definition: ScopHelper.h:178

polly::MemAccInst::getPointerOperand
llvm::Value * getPointerOperand() const
Definition: ScopHelper.h:248

polly::RejectLog
Stores all errors that occurred during the detection.
Definition: ScopDetectionDiagnostic.h:166

polly::RejectLog::report
void report(RejectReasonPtr Reject)
Definition: ScopDetectionDiagnostic.h:187

polly::RejectLog::hasErrors
bool hasErrors() const
Returns true, if we store at least one error.
Definition: ScopDetectionDiagnostic.h:182

polly::RejectLog::size
size_t size() const
Definition: ScopDetectionDiagnostic.h:177

polly::RejectReason
Base class of all reject reasons found during Scop detection.
Definition: ScopDetectionDiagnostic.h:118

polly::RejectReason::getMessage
virtual std::string getMessage() const =0
Generate a reasonable diagnostic message describing this error.

polly::ScopDetectionWrapperPass
Definition: ScopDetection.h:635

polly::ScopDetectionWrapperPass::Result
std::unique_ptr< ScopDetection > Result
Definition: ScopDetection.h:636

polly::ScopDetectionWrapperPass::releaseMemory
void releaseMemory() override
Definition: ScopDetection.cpp:2029

polly::ScopDetectionWrapperPass::getAnalysisUsage
void getAnalysisUsage(AnalysisUsage &AU) const override
Definition: ScopDetection.cpp:1999

polly::ScopDetectionWrapperPass::ScopDetectionWrapperPass
ScopDetectionWrapperPass()
Definition: ScopDetection.cpp:2017

polly::ScopDetectionWrapperPass::ID
static char ID
Definition: ScopDetection.h:643

polly::ScopDetectionWrapperPass::print
void print(raw_ostream &OS, const Module *M=nullptr) const override
Definition: ScopDetection.cpp:2010

polly::ScopDetectionWrapperPass::runOnFunction
bool runOnFunction(Function &F) override
Definition: ScopDetection.cpp:1986

polly::ScopDetection
Pass to detect the maximal static control parts (Scops) of a function.
Definition: ScopDetection.h:133

polly::ScopDetection::markFunctionAsInvalid
static void markFunctionAsInvalid(Function *F)
Mark the function as invalid so we will not extract any scop from the function.
Definition: ScopDetection.cpp:1816

polly::ScopDetection::addOverApproximatedRegion
bool addOverApproximatedRegion(Region *AR, DetectionContext &Context) const
Add the region AR as over approximated sub-region in Context.
Definition: ScopDetection.cpp:454

polly::ScopDetection::isValidAccess
bool isValidAccess(Instruction *Inst, const SCEV *AF, const SCEVUnknown *BP, DetectionContext &Context) const
Check if the memory access caused by Inst is valid.
Definition: ScopDetection.cpp:1072

polly::ScopDetection::onlyValidRequiredInvariantLoads
bool onlyValidRequiredInvariantLoads(InvariantLoadsSetTy &RequiredILS, DetectionContext &Context) const
Check if the given loads could be invariant and can be hoisted.
Definition: ScopDetection.cpp:472

polly::ScopDetection::isInvariant
bool isInvariant(Value &Val, const Region &Reg, DetectionContext &Ctx) const
Check if a value is invariant in the region Reg.
Definition: ScopDetection.cpp:804

polly::ScopDetection::isReducibleRegion
bool isReducibleRegion(Region &R, DebugLoc &DbgLoc) const
Check if a region is reducible or not.
Definition: ScopDetection.cpp:1843

polly::ScopDetection::computeAccessFunctions
bool computeAccessFunctions(DetectionContext &Context, const SCEVUnknown *BasePointer, std::shared_ptr< ArrayShape > Shape) const
Derive access functions for a given base pointer.
Definition: ScopDetection.cpp:984

polly::ScopDetection::getDetectionContext
DetectionContext * getDetectionContext(const Region *R) const
Return the detection context for R, nullptr if R was invalid.
Definition: ScopDetection.cpp:1959

polly::ScopDetection::removeCachedResultsRecursively
void removeCachedResultsRecursively(const Region &R)
Remove cached results for the children of R recursively.
Definition: ScopDetection.cpp:1554

polly::ScopDetection::hasSufficientCompute
bool hasSufficientCompute(DetectionContext &Context, int NumAffineLoops) const
Check if a region has sufficient compute instructions.
Definition: ScopDetection.cpp:1682

polly::ScopDetection::isProfitableRegion
bool isProfitableRegion(DetectionContext &Context) const
Check if a region is profitable to optimize.
Definition: ScopDetection.cpp:1720

polly::ScopDetection::emitMissedRemarks
void emitMissedRemarks(const Function &F)
Emit rejection remarks for all rejected regions.
Definition: ScopDetection.cpp:1835

polly::ScopDetection::isValidLoop
bool isValidLoop(Loop *L, DetectionContext &Context)
Is a loop valid with respect to a given region.
Definition: ScopDetection.cpp:1304

polly::ScopDetection::countBeneficialLoops
static ScopDetection::LoopStats countBeneficialLoops(Region *R, ScalarEvolution &SE, LoopInfo &LI, unsigned MinProfitableTrips)
Count the number of loops and the maximal loop depth in R.
Definition: ScopDetection.cpp:1390

polly::ScopDetection::lookupRejectionLog
const RejectLog * lookupRejectionLog(const Region *R) const
Return the set of rejection causes for R.
Definition: ScopDetection.cpp:1966

polly::ScopDetection::involvesMultiplePtrs
bool involvesMultiplePtrs(const SCEV *S0, const SCEV *S1, Loop *Scope) const
Check if S0 and S1 do contain multiple possibly aliasing pointers.
Definition: ScopDetection.cpp:508

polly::ScopDetection::isValidSwitch
bool isValidSwitch(BasicBlock &BB, SwitchInst *SI, Value *Condition, bool IsLoopBranch, DetectionContext &Context) const
Check if the switch SI with condition Condition is valid.
Definition: ScopDetection.cpp:554

polly::ScopDetection::isValidRegion
bool isValidRegion(DetectionContext &Context)
Check if a region is a Scop.
Definition: ScopDetection.cpp:1756

polly::ScopDetection::expandRegion
Region * expandRegion(Region &R)
Try to expand the region R.
Definition: ScopDetection.cpp:1487

polly::ScopDetection::DT
const DominatorTree & DT
Analyses used.
Definition: ScopDetection.h:208

polly::ScopDetection::hasBaseAffineAccesses
bool hasBaseAffineAccesses(DetectionContext &Context, const SCEVUnknown *BasePointer, Loop *Scope) const
Check if all accesses to a given BasePointer are affine.
Definition: ScopDetection.cpp:1037

polly::ScopDetection::detect
void detect(Function &F)
Definition: ScopDetection.cpp:345

polly::ScopDetection::SE
ScalarEvolution & SE
Definition: ScopDetection.h:209

polly::ScopDetection::ORE
OptimizationRemarkEmitter & ORE
OptimizationRemarkEmitter object used to emit diagnostic remarks.
Definition: ScopDetection.h:614

polly::ScopDetection::hasAffineMemoryAccesses
bool hasAffineMemoryAccesses(DetectionContext &Context) const
Delinearize all non affine memory accesses and return false when there exists a non affine memory acc...
Definition: ScopDetection.cpp:1054

polly::ScopDetection::isValidMemoryAccess
bool isValidMemoryAccess(MemAccInst Inst, DetectionContext &Context) const
Check if a memory access can be part of a Scop.
Definition: ScopDetection.cpp:1199

polly::ScopDetection::isValidCFG
bool isValidCFG(BasicBlock &BB, bool IsLoopBranch, bool AllowUnreachable, DetectionContext &Context)
Check if the control flow in a basic block is valid.
Definition: ScopDetection.cpp:658

polly::ScopDetection::printLocations
void printLocations(Function &F)
Print the locations of all detected scops.
Definition: ScopDetection.cpp:1824

polly::ScopDetection::hasValidArraySizes
bool hasValidArraySizes(DetectionContext &Context, SmallVectorImpl< const SCEV * > &Sizes, const SCEVUnknown *BasePointer, Loop *Scope) const
Check if the dimension size of a delinearized array is valid.
Definition: ScopDetection.cpp:919

polly::ScopDetection::ErrorBlockCache
DenseMap< std::tuple< const BasicBlock *, const Region * >, bool > ErrorBlockCache
Cache for the isErrorBlock function.
Definition: ScopDetection.h:222

polly::ScopDetection::removeCachedResults
void removeCachedResults(const Region &R)
Remove cached results for R.
Definition: ScopDetection.cpp:1563

polly::ScopDetection::ScopDetection
ScopDetection(const DominatorTree &DT, ScalarEvolution &SE, LoopInfo &LI, RegionInfo &RI, AAResults &AA, OptimizationRemarkEmitter &ORE)
Definition: ScopDetection.cpp:340

polly::ScopDetection::isValidBranch
bool isValidBranch(BasicBlock &BB, BranchInst *BI, Value *Condition, bool IsLoopBranch, DetectionContext &Context)
Check if the branch BI with condition Condition is valid.
Definition: ScopDetection.cpp:578

polly::ScopDetection::hasPossiblyDistributableLoop
bool hasPossiblyDistributableLoop(DetectionContext &Context) const
Check if the unique affine loop might be amendable to distribution.
Definition: ScopDetection.cpp:1698

polly::ScopDetection::verifyAnalysis
void verifyAnalysis()
Verify if all valid Regions in this Function are still valid after some transformations.
Definition: ScopDetection.cpp:1978

polly::ScopDetection::getDelinearizationTerms
SmallVector< const SCEV *, 4 > getDelinearizationTerms(DetectionContext &Context, const SCEVUnknown *BasePointer) const
Find for a given base pointer terms that hint towards dimension sizes of a multi-dimensional array.
Definition: ScopDetection.cpp:870

polly::ScopDetection::isValidInstruction
bool isValidInstruction(Instruction &Inst, DetectionContext &Context)
Check if an instruction can be part of a Scop.
Definition: ScopDetection.cpp:1211

polly::ScopDetection::AA
AAResults & AA
Definition: ScopDetection.h:212

polly::ScopDetection::isAffine
bool isAffine(const SCEV *S, Loop *Scope, DetectionContext &Context) const
Check if the SCEV S is affine in the current Context.
Definition: ScopDetection.cpp:542

polly::ScopDetection::ValidRegions
RegionSet ValidRegions
Definition: ScopDetection.h:138

polly::ScopDetection::DetectionContextMap
DetectionContextMapTy DetectionContextMap
Definition: ScopDetection.h:218

polly::ScopDetection::LI
LoopInfo & LI
Definition: ScopDetection.h:210

polly::ScopDetection::allBlocksValid
bool allBlocksValid(DetectionContext &Context)
Check if all basic block in the region are valid.
Definition: ScopDetection.cpp:1633

polly::ScopDetection::findScops
void findScops(Region &R)
Find the Scops in this region tree.
Definition: ScopDetection.cpp:1567

polly::ScopDetection::isValidIntrinsicInst
bool isValidIntrinsicInst(IntrinsicInst &II, DetectionContext &Context) const
Check if an intrinsic call can be part of a Scop.
Definition: ScopDetection.cpp:758

polly::ScopDetection::regionIsInvalidBecause
std::string regionIsInvalidBecause(const Region *R) const
Get a message why a region is invalid.
Definition: ScopDetection.cpp:440

polly::ScopDetection::isMaxRegionInScop
bool isMaxRegionInScop(const Region &R, bool Verify=true)
Is the region is the maximum region of a Scop?
Definition: ScopDetection.cpp:419

polly::ScopDetection::isValidCallInst
bool isValidCallInst(CallInst &CI, DetectionContext &Context) const
Check if a call instruction can be part of a Scop.
Definition: ScopDetection.cpp:690

polly::ScopDetection::verifyRegion
void verifyRegion(const Region &R)
Verify if R is still a valid part of Scop after some transformations.
Definition: ScopDetection.cpp:1971

polly::ScopDetection::isValidFunction
static bool isValidFunction(Function &F)
Check if the function F is marked as invalid.
Definition: ScopDetection.cpp:1820

polly::ScopDetection::isErrorBlock
bool isErrorBlock(llvm::BasicBlock &BB, const llvm::Region &R)
Check if the block is a error block.
Definition: ScopDetection.cpp:1474

polly::ScopDetection::invalid
bool invalid(DetectionContext &Context, bool Assert, Args &&...Arguments) const
Track diagnostics for invalid scops.
Definition: ScopDetection.cpp:399

polly::ScopDetection::canUseISLTripCount
bool canUseISLTripCount(Loop *L, DetectionContext &Context)
Can ISL compute the trip count of a loop.
Definition: ScopDetection.cpp:1277

polly::ScopDetection::RI
RegionInfo & RI
Definition: ScopDetection.h:211

polly::ScopDetection::countBeneficialSubLoops
static ScopDetection::LoopStats countBeneficialSubLoops(Loop *L, ScalarEvolution &SE, unsigned MinProfitableTrips)
Count the number of loops and the maximal loop depth in L.
Definition: ScopDetection.cpp:1368

assert
#define assert(exp)
Definition: isl_test_cpp-checked.cc:43

llvm
This file contains the declaration of the PolyhedralInfo class, which will provide an interface to ex...
Definition: Canonicalization.h:14

polly
Definition: Canonicalization.h:20

polly::BBPair
std::pair< llvm::BasicBlock *, llvm::BasicBlock * > BBPair
Type to hold region delimiters (entry & exit block).
Definition: Utils.h:31

polly::findValues
void findValues(const llvm::SCEV *Expr, llvm::ScalarEvolution &SE, llvm::SetVector< llvm::Value * > &Values)
Find the values referenced by SCEVUnknowns in a given SCEV expression.

polly::findLoops
void findLoops(const llvm::SCEV *Expr, llvm::SetVector< const llvm::Loop * > &Loops)
Find the loops referenced from a SCEV expression.

polly::getConditionFromTerminator
llvm::Value * getConditionFromTerminator(llvm::Instruction *TI)
Return the condition for the terminator TI.

polly::PollySkipFnAttr
StringRef PollySkipFnAttr
A function attribute which will cause Polly to skip the function.
Definition: ScopDetection.cpp:236

polly::PollyAllowFullFunction
bool PollyAllowFullFunction
Definition: ScopDetection.cpp:131

polly::RejectReasonPtr
std::shared_ptr< RejectReason > RejectReasonPtr
Definition: ScopDetectionDiagnostic.h:163

polly::PollyTrackFailures
bool PollyTrackFailures
Definition: ScopDetection.cpp:234

polly::isAffineExpr
bool isAffineExpr(const llvm::Region *R, llvm::Loop *Scope, const llvm::SCEV *Expression, llvm::ScalarEvolution &SE, InvariantLoadsSetTy *ILS=nullptr)

polly::MemoryKind::Value
@ Value
MemoryKind::Value: Models an llvm::Value.

polly::MemoryKind::PHI
@ PHI
MemoryKind::PHI: Models PHI nodes within the SCoP.

polly::emitRejectionRemarks
void emitRejectionRemarks(const BBPair &P, const RejectLog &Log, OptimizationRemarkEmitter &ORE)
Emit optimization remarks about the rejected regions to the user.
Definition: ScopDetectionDiagnostic.cpp:134

polly::getDebugLocation
void getDebugLocation(const llvm::Region *R, unsigned &LineBegin, unsigned &LineEnd, std::string &FileName)
Get the location of a region from the debug info.

polly::tryForwardThroughPHI
const llvm::SCEV * tryForwardThroughPHI(const llvm::SCEV *Expr, llvm::Region &R, llvm::ScalarEvolution &SE, ScopDetection *SD)
Try to look through PHI nodes, where some incoming edges come from error blocks.

polly::isDebugCall
bool isDebugCall(llvm::Instruction *Inst)
Is the given instruction a call to a debug function?

polly::getBBPairForRegion
BBPair getBBPairForRegion(const Region *R)
Return the region delimiters (entry & exit block) of R.
Definition: ScopDetectionDiagnostic.cpp:108

polly::PollyProcessUnprofitable
bool PollyProcessUnprofitable
Definition: ScopDetection.cpp:107

polly::createScopDetectionPrinterLegacyPass
llvm::Pass * createScopDetectionPrinterLegacyPass(llvm::raw_ostream &OS)

polly::InvariantLoadsSetTy
llvm::SetVector< llvm::AssertingVH< llvm::LoadInst > > InvariantLoadsSetTy
Type for a set of invariant loads.
Definition: ScopHelper.h:109

polly::MapInsnToMemAcc
std::map< const Instruction *, MemAcc > MapInsnToMemAcc
Definition: ScopDetection.h:113

polly::isHoistableLoad
bool isHoistableLoad(llvm::LoadInst *LInst, llvm::Region &R, llvm::LoopInfo &LI, llvm::ScalarEvolution &SE, const llvm::DominatorTree &DT, const InvariantLoadsSetTy &KnownInvariantLoads)
Check if LInst can be hoisted in R.

polly::PollyUseRuntimeAliasChecks
bool PollyUseRuntimeAliasChecks
Definition: ScopDetection.cpp:159

polly::PollyDelinearize
bool PollyDelinearize
Definition: ScopDetection.cpp:235

polly::hasScalarDepsInsideRegion
bool hasScalarDepsInsideRegion(const llvm::SCEV *Expr, const llvm::Region *R, llvm::Loop *Scope, bool AllowLoops, const InvariantLoadsSetTy &ILS)
Returns true when the SCEV contains references to instructions within the region.

polly::PollyAllowUnsignedOperations
bool PollyAllowUnsignedOperations
Definition: ScopDetection.cpp:151

polly::RejectReasonKind::Entry
@ Entry

polly::getUniqueNonErrorValue
llvm::Value * getUniqueNonErrorValue(llvm::PHINode *PHI, llvm::Region *R, ScopDetection *SD)
Return a unique non-error block incoming value for PHI if available.

polly::PollyInvariantLoadHoisting
bool PollyInvariantLoadHoisting
Definition: ScopDetection.cpp:218

polly::isIgnoredIntrinsic
bool isIgnoredIntrinsic(const llvm::Value *V)
Return true iff V is an intrinsic that we ignore during code generation.

polly::createScopDetectionWrapperPassPass
llvm::Pass * createScopDetectionWrapperPassPass()
Definition: ScopDetection.cpp:2059

Pair
Definition: template_cpp.cc:176

S
Definition: isl_test_cpp17-generic.cc:3

polly::ArrayShape
Definition: ScopDetection.h:90

polly::MemAcc
Definition: ScopDetection.h:100

polly::MemAcc::DelinearizedSubscripts
SmallVector< const SCEV *, 4 > DelinearizedSubscripts
Definition: ScopDetection.h:107

polly::ScopAnalysisPrinterPass::OS
raw_ostream & OS
Definition: ScopDetection.h:632

polly::ScopAnalysisPrinterPass::run
PreservedAnalyses run(Function &F, FunctionAnalysisManager &FAM)
Definition: ScopDetection.cpp:2048

polly::ScopAnalysis
Definition: ScopDetection.h:617

polly::ScopAnalysis::Result
ScopDetection Result
Definition: ScopDetection.h:620

polly::ScopAnalysis::run
Result run(Function &F, FunctionAnalysisManager &FAM)
Definition: ScopDetection.cpp:2035

polly::ScopAnalysis::ScopAnalysis
ScopAnalysis()
Definition: ScopDetection.cpp:2023

polly::ScopAnalysis::Key
static AnalysisKey Key
Definition: ScopDetection.h:618

polly::ScopDetection::DetectionContext
Context variables for SCoP detection.
Definition: ScopDetection.h:141

polly::ScopDetection::DetectionContext::Accesses
BaseToAFs Accesses
Map a base pointer to all access functions accessing it.
Definition: ScopDetection.h:158

polly::ScopDetection::DetectionContext::RequiredILS
InvariantLoadsSetTy RequiredILS
Loads that need to be invariant during execution.
Definition: ScopDetection.h:183

polly::ScopDetection::DetectionContext::ElementSize
BaseToElSize ElementSize
Definition: ScopDetection.h:165

polly::ScopDetection::DetectionContext::hasLoads
bool hasLoads
The region has at least one load instruction.
Definition: ScopDetection.h:168

polly::ScopDetection::DetectionContext::IsInvalid
bool IsInvalid
If this flag is set, the SCoP must eventually be rejected, even with KeepGoing.
Definition: ScopDetection.h:149

polly::ScopDetection::DetectionContext::HasUnknownAccess
bool HasUnknownAccess
Flag to indicate the region has at least one unknown access.
Definition: ScopDetection.h:174

polly::ScopDetection::DetectionContext::BoxedLoopsSet
BoxedLoopsSetTy BoxedLoopsSet
The set of loops contained in non-affine regions.
Definition: ScopDetection.h:180

polly::ScopDetection::DetectionContext::Verifying
bool Verifying
Definition: ScopDetection.h:145

polly::ScopDetection::DetectionContext::InsnToMemAcc
MapInsnToMemAcc InsnToMemAcc
Map to memory access description for the corresponding LLVM instructions.
Definition: ScopDetection.h:187

polly::ScopDetection::DetectionContext::Log
RejectLog Log
Container to remember rejection reasons for this region.
Definition: ScopDetection.h:152

polly::ScopDetection::DetectionContext::CurRegion
Region & CurRegion
Definition: ScopDetection.h:142

polly::ScopDetection::DetectionContext::NonAffineSubRegionSet
RegionSet NonAffineSubRegionSet
The set of non-affine subregions in the region we analyze.
Definition: ScopDetection.h:177

polly::ScopDetection::DetectionContext::NonAffineAccesses
llvm::SetVector< std::pair< const SCEVUnknown *, Loop * > > NonAffineAccesses
The set of base pointers with non-affine accesses.
Definition: ScopDetection.h:164

polly::ScopDetection::DetectionContext::AST
AliasSetTracker AST
Definition: ScopDetection.h:144

polly::ScopDetection::DetectionContext::hasStores
bool hasStores
The region has at least one store instruction.
Definition: ScopDetection.h:171

polly::ScopDetection::LoopStats
Helper data structure to collect statistics about loop counts.
Definition: ScopDetection.h:195

polly::ScopDetection::LoopStats::MaxDepth
int MaxDepth
Definition: ScopDetection.h:197

polly::ScopDetection::LoopStats::NumLoops
int NumLoops
Definition: ScopDetection.h:196

Res
static TupleKindPtr Res
Definition: template_cpp.cc:125

Str
static TupleKindPtr Str
Definition: template_cpp.cc:124

Ctx
static TupleKindPtr Ctx
Definition: template_cpp.cc:122