llvm.org/doxygen/LoopUtils_8cpp_source.html

//===-- LoopUtils.cpp - Loop Utility functions -------------------------===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

//

// This file defines common loop utility functions.

//

//===----------------------------------------------------------------------===//


#include "llvm/Transforms/Utils/LoopUtils.h"

#include "llvm/ADT/DenseSet.h"

#include "llvm/ADT/PriorityWorklist.h"

#include "llvm/ADT/ScopeExit.h"

#include "llvm/ADT/SetVector.h"

#include "llvm/ADT/SmallPtrSet.h"

#include "llvm/ADT/SmallVector.h"

#include "llvm/Analysis/AliasAnalysis.h"

#include "llvm/Analysis/BasicAliasAnalysis.h"

#include "llvm/Analysis/DomTreeUpdater.h"

#include "llvm/Analysis/GlobalsModRef.h"

#include "llvm/Analysis/InstSimplifyFolder.h"

#include "llvm/Analysis/LoopAccessAnalysis.h"

#include "llvm/Analysis/LoopInfo.h"

#include "llvm/Analysis/LoopPass.h"

#include "llvm/Analysis/MemorySSA.h"

#include "llvm/Analysis/MemorySSAUpdater.h"

#include "llvm/Analysis/ScalarEvolution.h"

#include "llvm/Analysis/ScalarEvolutionAliasAnalysis.h"

#include "llvm/Analysis/ScalarEvolutionExpressions.h"

#include "llvm/IR/DIBuilder.h"

#include "llvm/IR/Dominators.h"

#include "llvm/IR/Instructions.h"

#include "llvm/IR/IntrinsicInst.h"

#include "llvm/IR/MDBuilder.h"

#include "llvm/IR/Module.h"

#include "llvm/IR/PatternMatch.h"

#include "llvm/IR/ProfDataUtils.h"

#include "llvm/IR/ValueHandle.h"

#include "llvm/InitializePasses.h"

#include "llvm/Pass.h"

#include "llvm/Support/Compiler.h"

#include "llvm/Support/Debug.h"

#include "llvm/Transforms/Utils/BasicBlockUtils.h"

#include "llvm/Transforms/Utils/Local.h"

#include "llvm/Transforms/Utils/ScalarEvolutionExpander.h"


using namespace llvm;

using namespace llvm::PatternMatch;


#define DEBUG_TYPE "loop-utils"


// Loop attribute name queried by hasDisableAllTransformsHint().
static const char *LLVMLoopDisableNonforced = "llvm.loop.disable_nonforced";

// Loop attribute name queried by hasDisableLICMTransformsHint().
static const char *LLVMLoopDisableLICM = "llvm.licm.disable";


/// Ensures that exit blocks of \p L are only reached from inside the loop by
/// splitting off a ".loopexit" block for every exit block that also has
/// predecessors outside of \p L.
///
/// \p DT, \p LI, \p MSSAU and \p PreserveLCSSA are forwarded unchanged to
/// SplitBlockPredecessors. Exit blocks reached from the loop through an
/// indirectbr are left alone.
///
/// \returns true if a split was attempted for at least one exit block. Note
/// that this is also the case when SplitBlockPredecessors returned null.
bool llvm::formDedicatedExitBlocks(Loop *L, DominatorTree *DT, LoopInfo *LI,
                                   MemorySSAUpdater *MSSAU,
                                   bool PreserveLCSSA) {
  // Scratch list of in-loop predecessors; one vector is shared by all exit
  // blocks instead of allocating a new one per block.
  SmallVector<BasicBlock *, 4> LoopPreds;

  // Tries to give ExitBB a dedicated predecessor block. Returns true when a
  // split of its in-loop predecessors was attempted.
  auto MakeDedicated = [&](BasicBlock *ExitBB) -> bool {
    assert(LoopPreds.empty() &&
           "Must start with an empty predecessors list!");
    // Whichever way we leave, hand back an empty scratch list.
    auto ResetPreds = make_scope_exit([&] { LoopPreds.clear(); });

    // Partition the predecessors into in-loop ones (recorded) and outside
    // ones (only their existence matters).
    bool HasOutsidePred = false;
    for (BasicBlock *Pred : predecessors(ExitBB)) {
      if (!L->contains(Pred)) {
        HasOutsidePred = true;
        continue;
      }

      // We cannot rewrite exiting edges from an indirectbr.
      if (isa<IndirectBrInst>(Pred->getTerminator()))
        return false;

      LoopPreds.push_back(Pred);
    }

    assert(!LoopPreds.empty() && "Must have *some* loop predecessor!");

    // Every predecessor is inside the loop: already a dedicated exit.
    if (!HasOutsidePred)
      return false;

    BasicBlock *SplitBB = SplitBlockPredecessors(
        ExitBB, LoopPreds, ".loopexit", DT, LI, MSSAU, PreserveLCSSA);

    if (SplitBB)
      LLVM_DEBUG(dbgs() << "LoopSimplify: Creating dedicated exit block "
                        << SplitBB->getName() << "\n");
    else
      LLVM_DEBUG(
          dbgs() << "WARNING: Can't create a dedicated exit block for loop: "
                 << *L << "\n");
    return true;
  };

  // Discover the exit blocks on the fly by scanning the successors of every
  // loop block; the set guarantees each exit block is processed only once.
  bool Changed = false;
  SmallPtrSet<BasicBlock *, 4> SeenExits;
  for (BasicBlock *BB : L->blocks()) {
    for (BasicBlock *Succ : successors(BB)) {
      // Skip in-loop successors and exit blocks that were handled before.
      if (L->contains(Succ) || !SeenExits.insert(Succ).second)
        continue;

      Changed |= MakeDedicated(Succ);
    }
  }

  return Changed;
}


/// Returns the instructions defined inside \p L that have at least one user
/// whose parent block is not contained in \p L. Every user is expected to be
/// an Instruction (enforced by cast<>).
SmallVector<Instruction *, 8> llvm::findDefsUsedOutsideOfLoop(Loop *L) {
  SmallVector<Instruction *, 8> Escaping;

  // True if the given user sits in a block outside of the loop.
  auto LivesOutsideLoop = [L](User *U) {
    Instruction *UserInst = cast<Instruction>(U);
    return !L->contains(UserInst->getParent());
  };

  // FIXME: This could probably be a copy_if if the instruction reference
  // could be adapted into a pointer.
  for (BasicBlock *BB : L->getBlocks())
    for (Instruction &I : *BB)
      if (any_of(I.users(), LivesOutsideLoop))
        Escaping.push_back(&I);

  return Escaping;
}


/// Registers on \p AU the analyses that are shared by loop passes: each call
/// below marks an analysis as required and/or preserved.
void llvm::getLoopAnalysisUsage(AnalysisUsage &AU) {
  // By definition, all loop passes need the LoopInfo analysis and the
  // Dominator tree it depends on. Because they all participate in the loop
  // pass manager, they must also preserve these.
  AU.addRequired<DominatorTreeWrapperPass>();
  AU.addPreserved<DominatorTreeWrapperPass>();
  AU.addRequired<LoopInfoWrapperPass>();
  AU.addPreserved<LoopInfoWrapperPass>();

  // We must also preserve LoopSimplify and LCSSA. We locally access their IDs
  // here because users shouldn't directly get them from this header.
  extern char &LoopSimplifyID;
  extern char &LCSSAID;
  AU.addRequiredID(LoopSimplifyID);
  AU.addPreservedID(LoopSimplifyID);
  AU.addRequiredID(LCSSAID);
  AU.addPreservedID(LCSSAID);
  // This is used in the LPPassManager to perform LCSSA verification on passes
  // which preserve LCSSA form.
  AU.addRequired<LCSSAVerificationPass>();
  AU.addPreserved<LCSSAVerificationPass>();

  // Loop passes are designed to run inside of a loop pass manager which means
  // that any function analyses they require must be required by the first loop
  // pass in the manager (so that it is computed before the loop pass manager
  // runs) and preserved by all loop passes in the manager. To make this
  // reasonably robust, the set needed for most loop passes is maintained here.
  // If your loop pass requires an analysis not listed here, you will need to
  // carefully audit the loop pass manager nesting structure that results.
  AU.addRequired<AAResultsWrapperPass>();
  AU.addPreserved<AAResultsWrapperPass>();
  // The following alias analyses are only preserved, not required.
  AU.addPreserved<BasicAAWrapperPass>();
  AU.addPreserved<GlobalsAAWrapperPass>();
  AU.addPreserved<SCEVAAWrapperPass>();
  AU.addRequired<ScalarEvolutionWrapperPass>();
  AU.addPreserved<ScalarEvolutionWrapperPass>();
  // FIXME: When all loop passes preserve MemorySSA, it can be required and
  // preserved here instead of the individual handling in each pass.
}


/// Manually defined generic "LoopPass" dependency initialization. This is used
/// to initialize the passes named in \c getLoopAnalysisUsage. It can be used
/// within a loop pass's initialization with:
///
///   INITIALIZE_PASS_DEPENDENCY(LoopPass)
///
/// As-if "LoopPass" were a pass.
///
/// NOTE(review): the list below is not identical to the set registered in
/// getLoopAnalysisUsage: MemorySSAWrapperPass is initialized here although it
/// is not required there, and LCSSAVerificationPass is required there but not
/// initialized here. Confirm whether this is intentional.
void llvm::initializeLoopPassPass(PassRegistry &Registry) {
  INITIALIZE_PASS_DEPENDENCY(DominatorTreeWrapperPass)
  INITIALIZE_PASS_DEPENDENCY(LoopInfoWrapperPass)
  INITIALIZE_PASS_DEPENDENCY(LoopSimplify)
  INITIALIZE_PASS_DEPENDENCY(LCSSAWrapperPass)
  INITIALIZE_PASS_DEPENDENCY(AAResultsWrapperPass)
  INITIALIZE_PASS_DEPENDENCY(BasicAAWrapperPass)
  INITIALIZE_PASS_DEPENDENCY(GlobalsAAWrapperPass)
  INITIALIZE_PASS_DEPENDENCY(SCEVAAWrapperPass)
  INITIALIZE_PASS_DEPENDENCY(ScalarEvolutionWrapperPass)
  INITIALIZE_PASS_DEPENDENCY(MemorySSAWrapperPass)
}


/// Builds the two-operand metadata node {MDString(\p Name), i32 \p V} in the
/// LLVMContext of \p TheLoop's header block.
static MDNode *createStringMetadata(Loop *TheLoop, StringRef Name, unsigned V) {
  LLVMContext &Ctx = TheLoop->getHeader()->getContext();
  Metadata *Key = MDString::get(Ctx, Name);
  Metadata *Value =
      ConstantAsMetadata::get(ConstantInt::get(Type::getInt32Ty(Ctx), V));
  return MDNode::get(Ctx, {Key, Value});
}


/// Attaches the attribute {\p StringMD, \p V} to the loop ID of \p TheLoop.
///
/// All other attributes of an existing loop ID are carried over. An existing
/// two-operand attribute named \p StringMD is replaced, unless it already
/// holds the requested value, in which case the loop is left untouched.
void llvm::addStringMetadataToLoop(Loop *TheLoop, const char *StringMD,
                                   unsigned V) {
  // Slot 0 is a placeholder for the self-reference that is patched in below.
  SmallVector<Metadata *, 4> NewOps(1);

  // Copy the attributes of the current loop ID, if there is one.
  MDNode *OldID = TheLoop->getLoopID();
  const unsigned NumOldOps = OldID ? OldID->getNumOperands() : 0;
  for (unsigned Idx = 1; Idx < NumOldOps; ++Idx) {
    MDNode *Attr = cast<MDNode>(OldID->getOperand(Idx));

    // Only nodes of the form "key, value" can be an earlier setting of
    // StringMD; everything else is retained as is.
    MDString *Key = Attr->getNumOperands() == 2
                        ? dyn_cast<MDString>(Attr->getOperand(0))
                        : nullptr;
    if (!Key || Key->getString() != StringMD) {
      NewOps.push_back(Attr);
      continue;
    }

    // NOTE(review): the stored value is sign-extended before being compared
    // with the unsigned V, so an i32 operand with the top bit set never
    // matches and the loop ID is rebuilt - confirm whether that is intended.
    ConstantInt *OldValue =
        mdconst::extract_or_null<ConstantInt>(Attr->getOperand(1));
    if (OldValue && OldValue->getSExtValue() == V)
      return; // Already in place, nothing to do.

    // Otherwise the stale entry is dropped here; its replacement is appended
    // after the remaining attributes have been copied.
  }

  NewOps.push_back(createStringMetadata(TheLoop, StringMD, V));

  // Install the new node as loop ID, with operand 0 referring to itself.
  LLVMContext &Ctx = TheLoop->getHeader()->getContext();
  MDNode *NewID = MDNode::get(Ctx, NewOps);
  NewID->replaceOperandWith(0, NewID);
  TheLoop->setLoopID(NewID);
}


/// Reads the "llvm.loop.vectorize.width" attribute of \p TheLoop and combines
/// it with "llvm.loop.vectorize.scalable.enable" (treated as false when
/// absent) into an ElementCount. Returns std::nullopt if no width is set.
std::optional<ElementCount>
llvm::getOptionalElementCountLoopAttribute(const Loop *TheLoop) {
  std::optional<int> Width =
      getOptionalIntLoopAttribute(TheLoop, "llvm.loop.vectorize.width");
  if (!Width)
    return std::nullopt;

  // The scalable flag is only looked up once a width is known.
  std::optional<int> ScalableAttr = getOptionalIntLoopAttribute(
      TheLoop, "llvm.loop.vectorize.scalable.enable");
  const bool IsScalable = ScalableAttr.value_or(false);
  return ElementCount::get(*Width, IsScalable);
}


/// Creates the loop ID for a loop that results from transforming the loop
/// identified by \p OrigLoopID.
///
/// \param OrigLoopID       Loop ID of the original loop; may be null.
/// \param FollowupOptions  Names of followup attributes of \p OrigLoopID
///                         whose operands (all but the name) are appended to
///                         the new loop ID.
/// \param InheritOptionsExceptPrefix
///                         Selects the attributes copied from \p OrigLoopID:
///                         nullptr copies all of them, "" copies none, and any
///                         other string copies all attributes whose name does
///                         not start with it (attributes without a string
///                         name are always copied in that mode).
/// \param AlwaysNew        If true, never signal "no followup specified" and
///                         never hand back \p OrigLoopID itself.
///
/// \returns std::nullopt if \p AlwaysNew is false and there is no original
///          loop ID or none of \p FollowupOptions is present; \p OrigLoopID if
///          \p AlwaysNew is false and the attribute list did not change;
///          nullptr if the resulting loop has no attributes (or there was no
///          original loop ID and \p AlwaysNew is set); the new loop ID
///          otherwise.
std::optional<MDNode *> llvm::makeFollowupLoopID(
    MDNode *OrigLoopID, ArrayRef<StringRef> FollowupOptions,
    const char *InheritOptionsExceptPrefix, bool AlwaysNew) {
  if (!OrigLoopID) {
    if (AlwaysNew)
      return nullptr;
    return std::nullopt;
  }

  assert(OrigLoopID->getOperand(0) == OrigLoopID);

  bool InheritAllAttrs = !InheritOptionsExceptPrefix;
  bool InheritSomeAttrs =
      InheritOptionsExceptPrefix && InheritOptionsExceptPrefix[0] != '\0';
  SmallVector<Metadata *, 8> MDs;
  // Reserve operand 0 for the self-reference.
  MDs.push_back(nullptr);

  bool Changed = false;
  if (InheritAllAttrs || InheritSomeAttrs) {
    // Decides whether a single attribute of the original loop is carried
    // over. Only reached when at least one of the two inherit modes is on.
    auto InheritThisAttribute = [InheritAllAttrs,
                                 InheritOptionsExceptPrefix](MDNode *Op) {
      // A null prefix means "inherit everything". Previously this case fell
      // through to "inherit nothing", silently dropping all attributes.
      if (InheritAllAttrs)
        return true;

      // Skip malformatted attribute metadata nodes.
      if (Op->getNumOperands() == 0)
        return true;
      Metadata *NameMD = Op->getOperand(0).get();
      if (!isa<MDString>(NameMD))
        return true;
      StringRef AttrName = cast<MDString>(NameMD)->getString();

      // Do not inherit excluded attributes.
      return !AttrName.starts_with(InheritOptionsExceptPrefix);
    };

    for (const MDOperand &Existing : drop_begin(OrigLoopID->operands())) {
      MDNode *Op = cast<MDNode>(Existing.get());

      if (InheritThisAttribute(Op))
        MDs.push_back(Op);
      else
        Changed = true;
    }
  } else {
    // Modified if we dropped at least one attribute.
    Changed = OrigLoopID->getNumOperands() > 1;
  }

  bool HasAnyFollowup = false;
  for (StringRef OptionName : FollowupOptions) {
    MDNode *FollowupNode = findOptionMDForLoopID(OrigLoopID, OptionName);
    if (!FollowupNode)
      continue;

    HasAnyFollowup = true;
    // Operand 0 is the followup's own name; the rest are the attributes to
    // attach to the new loop.
    for (const MDOperand &Option : drop_begin(FollowupNode->operands())) {
      MDs.push_back(Option.get());
      Changed = true;
    }
  }

  // Attributes of the followup loop were not specified explicitly, so signal
  // to the transformation pass to add suitable attributes.
  if (!AlwaysNew && !HasAnyFollowup)
    return std::nullopt;

  // If no attributes were added or removed, the previous loop ID can be
  // reused.
  if (!AlwaysNew && !Changed)
    return OrigLoopID;

  // No attributes is equivalent to having no !llvm.loop metadata at all.
  if (MDs.size() == 1)
    return nullptr;

  // Build the new loop ID.
  MDTuple *FollowupLoopID = MDNode::get(OrigLoopID->getContext(), MDs);
  FollowupLoopID->replaceOperandWith(0, FollowupLoopID);
  return FollowupLoopID;
}


bool llvm::hasDisableAllTransformsHint(const Loop *L) {

  return getBooleanLoopAttribute(L, LLVMLoopDisableNonforced);

}


/// Returns the boolean value of the "llvm.licm.disable" attribute of \p L.
bool llvm::hasDisableLICMTransformsHint(const Loop *L) {
  const bool DisableLICM = getBooleanLoopAttribute(L, LLVMLoopDisableLICM);
  return DisableLICM;
}


/// Classifies what the metadata of \p L says about unrolling. The attributes
/// are consulted in priority order: an explicit disable, then an unroll
/// count, then enable/full, and finally the disable-all-transforms hint.
TransformationMode llvm::hasUnrollTransformation(const Loop *L) {
  if (getBooleanLoopAttribute(L, "llvm.loop.unroll.disable"))
    return TM_SuppressedByUser;

  if (std::optional<int> Count =
          getOptionalIntLoopAttribute(L, "llvm.loop.unroll.count")) {
    // A count of one is treated as suppression; any other count forces it.
    if (*Count == 1)
      return TM_SuppressedByUser;
    return TM_ForcedByUser;
  }

  if (getBooleanLoopAttribute(L, "llvm.loop.unroll.enable") ||
      getBooleanLoopAttribute(L, "llvm.loop.unroll.full"))
    return TM_ForcedByUser;

  return hasDisableAllTransformsHint(L) ? TM_Disable : TM_Unspecified;
}


/// Classifies what the metadata of \p L says about unroll-and-jam. The
/// attributes are consulted in priority order: an explicit disable, then a
/// count, then enable, and finally the disable-all-transforms hint.
TransformationMode llvm::hasUnrollAndJamTransformation(const Loop *L) {
  if (getBooleanLoopAttribute(L, "llvm.loop.unroll_and_jam.disable"))
    return TM_SuppressedByUser;

  if (std::optional<int> Count =
          getOptionalIntLoopAttribute(L, "llvm.loop.unroll_and_jam.count")) {
    // A count of one is treated as suppression; any other count forces it.
    if (*Count == 1)
      return TM_SuppressedByUser;
    return TM_ForcedByUser;
  }

  if (getBooleanLoopAttribute(L, "llvm.loop.unroll_and_jam.enable"))
    return TM_ForcedByUser;

  return hasDisableAllTransformsHint(L) ? TM_Disable : TM_Unspecified;
}


/// Classifies what the metadata of \p L says about vectorization, based on
/// the "llvm.loop.vectorize.enable", vectorize width, interleave count and
/// "llvm.loop.isvectorized" attributes, falling back to the
/// disable-all-transforms hint.
TransformationMode llvm::hasVectorizeTransformation(const Loop *L) {
  const std::optional<bool> Enable =
      getOptionalBoolLoopAttribute(L, "llvm.loop.vectorize.enable");

  // An explicit "enable = false" wins over everything else.
  const bool ExplicitlyOff = Enable.has_value() && !*Enable;
  if (ExplicitlyOff)
    return TM_SuppressedByUser;

  const std::optional<ElementCount> VectorizeWidth =
      getOptionalElementCountLoopAttribute(L);
  const std::optional<int> InterleaveCount =
      getOptionalIntLoopAttribute(L, "llvm.loop.interleave.count");

  const bool ExplicitlyOn = Enable.has_value() && *Enable;
  // Both a scalar width and an interleave count of one were requested.
  const bool WidthAndInterleaveOne =
      VectorizeWidth && VectorizeWidth->isScalar() && InterleaveCount == 1;

  // 'Forcing' vector width and interleave count to one effectively disables
  // this transformation.
  if (ExplicitlyOn && WidthAndInterleaveOne)
    return TM_SuppressedByUser;

  if (getBooleanLoopAttribute(L, "llvm.loop.isvectorized"))
    return TM_Disable;

  if (ExplicitlyOn)
    return TM_ForcedByUser;

  if (WidthAndInterleaveOne)
    return TM_Disable;

  const bool WantsVectorWidth = VectorizeWidth && VectorizeWidth->isVector();
  if (WantsVectorWidth || InterleaveCount > 1)
    return TM_Enable;

  return hasDisableAllTransformsHint(L) ? TM_Disable : TM_Unspecified;
}


/// Classifies what the metadata of \p L says about loop distribution:
/// forced if "llvm.loop.distribute.enable" is set, otherwise governed by the
/// disable-all-transforms hint.
TransformationMode llvm::hasDistributeTransformation(const Loop *L) {
  const bool Forced =
      getBooleanLoopAttribute(L, "llvm.loop.distribute.enable");
  if (Forced)
    return TM_ForcedByUser;

  return hasDisableAllTransformsHint(L) ? TM_Disable : TM_Unspecified;
}


/// Classifies what the metadata of \p L says about LICM versioning:
/// suppressed if "llvm.loop.licm_versioning.disable" is set, otherwise
/// governed by the disable-all-transforms hint.
TransformationMode llvm::hasLICMVersioningTransformation(const Loop *L) {
  const bool Suppressed =
      getBooleanLoopAttribute(L, "llvm.loop.licm_versioning.disable");
  if (Suppressed)
    return TM_SuppressedByUser;

  return hasDisableAllTransformsHint(L) ? TM_Disable : TM_Unspecified;
}


/// Walks the dominator tree breadth-first starting at \p N and returns the
/// blocks encountered that belong to \p CurLoop. The block of \p N comes
/// first (if it is in the loop); dominator-tree children of blocks outside
/// the loop are not explored.
SmallVector<BasicBlock *, 16> llvm::collectChildrenInLoop(DominatorTree *DT,
                                                          DomTreeNode *N,
                                                          const Loop *CurLoop) {
  // Serves as both the BFS queue and the result.
  SmallVector<BasicBlock *, 16> Collected;

  // Only include subregions in the top level loop.
  auto EnqueueIfInLoop = [&Collected, CurLoop](DomTreeNode *Node) {
    if (BasicBlock *BB = Node->getBlock(); CurLoop->contains(BB))
      Collected.push_back(BB);
  };

  EnqueueIfInLoop(N);

  // The vector grows while it is scanned, so walk it by index.
  for (size_t Next = 0; Next < Collected.size(); ++Next)
    for (DomTreeNode *Child : DT->getNode(Collected[Next])->children())
      EnqueueIfInLoop(Child);

  return Collected;
}


/// Returns true if the phi \p PN and its incoming value from \p LatchBlock
/// are used by nothing other than each other and \p Cond.
bool llvm::isAlmostDeadIV(PHINode *PN, BasicBlock *LatchBlock, Value *Cond) {
  const int LatchIdx = PN->getBasicBlockIndex(LatchBlock);
  assert(LatchIdx != -1 && "LatchBlock is not a case in this PHINode");
  Value *IncV = PN->getIncomingValue(LatchIdx);

  // True if every user of V is either Cond or Partner.
  auto OnlyUsedBy = [Cond](Value *V, Value *Partner) {
    return all_of(V->users(),
                  [&](User *U) { return U == Cond || U == Partner; });
  };

  return OnlyUsedBy(PN, IncV) && OnlyUsedBy(IncV, PN);
}


/// Removes the loop \p L by making its preheader branch straight to the
/// unique exit block (or end in `unreachable` if the loop has no exit block).
///
/// \p L must have a preheader whose terminator has a single successor and no
/// side effects, and must have either one unique exit block or none.
///
/// \param DT    Optional. If given, the loop must be in LCSSA form and the
///              dominator tree is updated eagerly.
/// \param SE    Optional. If given, it is told to forget the loop.
/// \param LI    Optional. The loop's blocks and the loop itself are only
///              erased when this is given; otherwise the blocks merely have
///              their references dropped.
/// \param MSSA  Optional. MemorySSA is only updated when \p DT is given too.
void llvm::deleteDeadLoop(Loop *L, DominatorTree *DT, ScalarEvolution *SE,
                          LoopInfo *LI, MemorySSA *MSSA) {
  assert((!DT || L->isLCSSAForm(*DT)) && "Expected LCSSA!");
  auto *Preheader = L->getLoopPreheader();
  assert(Preheader && "Preheader should exist!");

  std::unique_ptr<MemorySSAUpdater> MSSAU;
  if (MSSA)
    MSSAU = std::make_unique<MemorySSAUpdater>(MSSA);

  // Now that we know the removal is safe, remove the loop by changing the
  // branch from the preheader to go to the single exit block.
  //
  // Because we're deleting a large chunk of code at once, the sequence in which
  // we remove things is very important to avoid invalidation issues.

  // Tell ScalarEvolution that the loop is deleted. Do this before
  // deleting the loop so that ScalarEvolution can look at the loop
  // to determine what it needs to clean up.
  if (SE) {
    SE->forgetLoop(L);
    SE->forgetBlockAndLoopDispositions();
  }

  Instruction *OldTerm = Preheader->getTerminator();
  assert(!OldTerm->mayHaveSideEffects() &&
         "Preheader must end with a side-effect-free terminator");
  assert(OldTerm->getNumSuccessors() == 1 &&
         "Preheader must have a single successor");
  // Connect the preheader to the exit block. Keep the old edge to the header
  // around to perform the dominator tree update in two separate steps
  // -- #1 insertion of the edge preheader -> exit and #2 deletion of the edge
  // preheader -> header.
  //
  //
  // 0.  Preheader          1.  Preheader           2.  Preheader
  //        |                    |   |                   |
  //        V                    |   V                   |
  //      Header <--\            | Header <--\           | Header <--\
  //       |  |     |            |  |  |     |           |  |  |     |
  //       |  V     |            |  |  V     |           |  |  V     |
  //       | Body --/            |  | Body --/           |  | Body --/
  //       V                     V  V                    V  V
  //      Exit                   Exit                    Exit
  //
  // By doing this in two separate steps we can perform the dominator tree
  // update without using the batch update API.
  //
  // Even when the loop is never executed, we cannot remove the edge from the
  // source block to the exit block. Consider the case where the unexecuted loop
  // branches back to an outer loop. If we deleted the loop and removed the edge
  // coming to this inner loop, this will break the outer loop structure (by
  // deleting the backedge of the outer loop). If the outer loop is indeed a
  // non-loop, it will be deleted in a future iteration of loop deletion pass.
  IRBuilder<> Builder(OldTerm);

  auto *ExitBlock = L->getUniqueExitBlock();
  DomTreeUpdater DTU(DT, DomTreeUpdater::UpdateStrategy::Eager);
  if (ExitBlock) {
    assert(L->hasDedicatedExits() && "Loop should have dedicated exits!");

    // Step 1: a never-taken conditional branch keeps the edge to the header
    // alive while adding the edge to the exit block.
    Builder.CreateCondBr(Builder.getFalse(), L->getHeader(), ExitBlock);
    // Remove the old branch. The conditional branch becomes a new terminator.
    OldTerm->eraseFromParent();

    // Rewrite phis in the exit block to get their inputs from the Preheader
    // instead of the exiting block.
    for (PHINode &P : ExitBlock->phis()) {
      // Set the zero'th element of Phi to be from the preheader and remove all
      // other incoming values. Given the loop has dedicated exits, all other
      // incoming values must be from the exiting blocks.
      int PredIndex = 0;
      P.setIncomingBlock(PredIndex, Preheader);
      // Removes all incoming values from all other exiting blocks (including
      // duplicate values from an exiting block).
      // Nuke all entries except the zero'th entry which is the preheader entry.
      P.removeIncomingValueIf([](unsigned Idx) { return Idx != 0; },
                              /* DeletePHIIfEmpty */ false);

      assert((P.getNumIncomingValues() == 1 &&
              P.getIncomingBlock(PredIndex) == Preheader) &&
             "Should have exactly one value and that's from the preheader!");
    }

    if (DT) {
      DTU.applyUpdates({{DominatorTree::Insert, Preheader, ExitBlock}});
      if (MSSA) {
        MSSAU->applyUpdates({{DominatorTree::Insert, Preheader, ExitBlock}},
                            *DT);
        if (VerifyMemorySSA)
          MSSA->verifyMemorySSA();
      }
    }

    // Step 2: disconnect the loop body by branching directly to its exit.
    Builder.SetInsertPoint(Preheader->getTerminator());
    Builder.CreateBr(ExitBlock);
    // Remove the old branch.
    Preheader->getTerminator()->eraseFromParent();
  } else {
    assert(L->hasNoExitBlocks() &&
           "Loop should have either zero or one exit blocks.");

    // No exit block: the preheader simply ends in `unreachable`.
    Builder.SetInsertPoint(OldTerm);
    Builder.CreateUnreachable();
    Preheader->getTerminator()->eraseFromParent();
  }

  if (DT) {
    DTU.applyUpdates({{DominatorTree::Delete, Preheader, L->getHeader()}});
    if (MSSA) {
      MSSAU->applyUpdates({{DominatorTree::Delete, Preheader, L->getHeader()}},
                          *DT);
      SmallSetVector<BasicBlock *, 8> DeadBlockSet(L->block_begin(),
                                                   L->block_end());
      MSSAU->removeBlocks(DeadBlockSet);
      if (VerifyMemorySSA)
        MSSA->verifyMemorySSA();
    }
  }

  // Use a set to unique and a vector to guarantee deterministic ordering.
  llvm::SmallDenseSet<DebugVariable, 4> DeadDebugSet;
  llvm::SmallVector<DbgVariableRecord *, 4> DeadDbgVariableRecords;

  if (ExitBlock) {
    // Given LCSSA form is satisfied, we should not have users of instructions
    // within the dead loop outside of the loop. However, LCSSA doesn't take
    // unreachable uses into account. We handle them here.
    // We could do it after dropping all references (in this case all users in
    // the loop will be already eliminated and we have less work to do), but
    // according to the API doc of User::dropAllReferences the only valid
    // operation after dropping references is deletion. So let's substitute all
    // usages of instructions from the loop with a poison value of the
    // corresponding type first.
    for (auto *Block : L->blocks())
      for (Instruction &I : *Block) {
        auto *Poison = PoisonValue::get(I.getType());
        for (Use &U : llvm::make_early_inc_range(I.uses())) {
          if (auto *Usr = dyn_cast<Instruction>(U.getUser()))
            if (L->contains(Usr->getParent()))
              continue;
          // If we have a DT then we can check that uses outside a loop are
          // only in unreachable blocks.
          if (DT)
            assert(!DT->isReachableFromEntry(U) &&
                   "Unexpected user in reachable block");
          U.set(Poison);
        }

        // For one of each variable encountered, preserve a debug record (set
        // to Poison) and transfer it to the loop exit. This terminates any
        // variable locations that were set during the loop.
        for (DbgVariableRecord &DVR :
             llvm::make_early_inc_range(filterDbgVars(I.getDbgRecordRange()))) {
          DebugVariable Key(DVR.getVariable(), DVR.getExpression(),
                            DVR.getDebugLoc().get());
          if (!DeadDebugSet.insert(Key).second)
            continue;
          // Unlinks the DVR from its container, for later insertion.
          DVR.removeFromParent();
          DeadDbgVariableRecords.push_back(&DVR);
        }
      }

    // After the loop has been deleted all the values defined and modified
    // inside the loop are going to be unavailable. Values computed in the
    // loop will have been deleted, automatically causing their debug uses
    // to be replaced with undef. Loop invariant values will still be
    // available. Move dbg.values out of the loop so that earlier location
    // ranges are still terminated and loop invariant assignments are
    // preserved.
    BasicBlock::iterator InsertDbgValueBefore =
        ExitBlock->getFirstInsertionPt();
    assert(InsertDbgValueBefore != ExitBlock->end() &&
           "There should be a non-PHI instruction in exit block, else these "
           "instructions will have no parent.");

    // Due to the "head" bit in BasicBlock::iterator, we're going to insert
    // each DbgVariableRecord right at the start of the block, whereas
    // dbg.values would be repeatedly inserted before the first instruction.
    // To replicate this behaviour, do it backwards.
    for (DbgVariableRecord *DVR : llvm::reverse(DeadDbgVariableRecords))
      ExitBlock->insertDbgRecordBefore(DVR, InsertDbgValueBefore);
  }

  // Remove the block from the reference counting scheme, so that we can
  // delete it freely later.
  for (auto *Block : L->blocks())
    Block->dropAllReferences();

  if (MSSA && VerifyMemorySSA)
    MSSA->verifyMemorySSA();

  if (LI) {
    // Erase the instructions and the blocks without having to worry
    // about ordering because we already dropped the references.
    // NOTE: This iteration is safe because erasing the block does not remove
    // its entry from the loop's block list.  We do that in the next section.
    for (BasicBlock *BB : L->blocks())
      BB->eraseFromParent();

    // Finally, remove the blocks from loopinfo.  This has to happen late
    // because otherwise our loop iterators won't work.

    SmallPtrSet<BasicBlock *, 8> blocks(llvm::from_range, L->blocks());
    for (BasicBlock *BB : blocks)
      LI->removeBlock(BB);

    // The last step is to update LoopInfo now that we've eliminated this loop.
    // Note: LoopInfo::erase removes the given loop and relinks its subloops
    // with its parent, while removeLoop/removeChildLoop remove the given loop
    // but do not relink its subloops, which is what we want.
    if (Loop *ParentLoop = L->getParentLoop()) {
      Loop::iterator I = find(*ParentLoop, L);
      assert(I != ParentLoop->end() && "Couldn't find loop");
      ParentLoop->removeChildLoop(I);
    } else {
      Loop::iterator I = find(*LI, L);
      assert(I != LI->end() && "Couldn't find loop");
      LI->removeLoop(I);
    }
    LI->destroy(L);
  }
}


/// Removes the backedge of \p L (latch -> header), erases the loop from
/// \p LI, and rebuilds LCSSA on the outermost enclosing loop when \p L was
/// nested. \p L must have a single latch. \p MSSA is optional and is kept up
/// to date when given.
void llvm::breakLoopBackedge(Loop *L, DominatorTree &DT, ScalarEvolution &SE,
                             LoopInfo &LI, MemorySSA *MSSA) {
  BasicBlock *Latch = L->getLoopLatch();
  assert(Latch && "multiple latches not yet supported");
  BasicBlock *Header = L->getHeader();
  // Remember the outermost loop now; L is erased from LoopInfo further down.
  Loop *OutermostLoop = L->getOutermostLoop();

  SE.forgetLoop(L);
  SE.forgetBlockAndLoopDispositions();

  std::unique_ptr<MemorySSAUpdater> MSSAU =
      MSSA ? std::make_unique<MemorySSAUpdater>(MSSA) : nullptr;

  // Updates the CFG and the dominator tree. A couple of common cases are
  // special-cased for code quality and test readability reasons.
  auto RemoveBackedge = [&]() -> void {
    auto *LatchBr = dyn_cast<BranchInst>(Latch->getTerminator());

    // Unconditional latch branch: the latch simply becomes unreachable.
    if (LatchBr && !LatchBr->isConditional()) {
      DomTreeUpdater DTU(&DT, DomTreeUpdater::UpdateStrategy::Eager);
      (void)changeToUnreachable(LatchBr, /*PreserveLCSSA*/ true, &DTU,
                                MSSAU.get());
      return;
    }

    // Conditional branch in an exiting latch: branch straight to the exit.
    // The latch can be shared by an inner and an outer loop, so for a
    // conditional latch the other target is not necessarily an exit of L -
    // hence the explicit isLoopExiting check.
    if (LatchBr && L->isLoopExiting(Latch)) {
      // TODO: Generalize ConstantFoldTerminator so that it can be used
      // here without invalidating LCSSA or MemorySSA.  (Tricky case for
      // LCSSA: header is an exit block of a preceding sibling loop w/o
      // dedicated exits.)
      BasicBlock *ExitBB = L->contains(LatchBr->getSuccessor(0))
                               ? LatchBr->getSuccessor(1)
                               : LatchBr->getSuccessor(0);

      DomTreeUpdater DTU(&DT, DomTreeUpdater::UpdateStrategy::Eager);
      Header->removePredecessor(Latch, true);

      IRBuilder<> Builder(LatchBr);
      BranchInst *ExitBr = Builder.CreateBr(ExitBB);
      // Transfer the metadata to the new branch instruction (minus the
      // loop info since this is no longer a loop).
      ExitBr->copyMetadata(*LatchBr, {LLVMContext::MD_dbg,
                                      LLVMContext::MD_annotation});

      LatchBr->eraseFromParent();
      DTU.applyUpdates({{DominatorTree::Delete, Latch, Header}});
      if (MSSA)
        MSSAU->applyUpdates({{DominatorTree::Delete, Latch, Header}}, DT);
      return;
    }

    // General case.  By splitting the backedge, and then explicitly making it
    // unreachable we gracefully handle corner cases such as switch and invoke
    // terminators.
    BasicBlock *BackedgeBB = SplitEdge(Latch, Header, &DT, &LI, MSSAU.get());

    DomTreeUpdater DTU(&DT, DomTreeUpdater::UpdateStrategy::Eager);
    (void)changeToUnreachable(BackedgeBB->getTerminator(),
                              /*PreserveLCSSA*/ true, &DTU, MSSAU.get());
  };
  RemoveBackedge();

  // Erase (and destroy) this loop instance.  Handles relinking sub-loops
  // and blocks within the loop as needed.
  LI.erase(L);

  // If the loop we broke had a parent, then changeToUnreachable might have
  // caused a block to be removed from the parent loop (see loop_nest_lcssa
  // test case in zero-btc.ll for an example), thus changing the parent's
  // exit blocks.  If that happened, we need to rebuild LCSSA on the outermost
  // loop which might have had a block removed.
  if (OutermostLoop != L)
    formLCSSARecursively(*OutermostLoop, DT, &LI, &SE);
}


/// Returns the terminator of the latch of \p L if \p L has a single latch
/// that is an exiting block and ends in a two-successor branch instruction;
/// returns nullptr otherwise. The loop may have further exiting blocks.
static BranchInst *getExpectedExitLoopLatchBranch(Loop *L) {
  BasicBlock *Latch = L->getLoopLatch();
  if (!Latch)
    return nullptr;

  auto *Br = dyn_cast<BranchInst>(Latch->getTerminator());
  const bool IsExitingCondBr =
      Br && Br->getNumSuccessors() == 2 && L->isLoopExiting(Latch);
  if (!IsExitingCondBr)
    return nullptr;

  assert((Br->getSuccessor(0) == L->getHeader() ||
          Br->getSuccessor(1) == L->getHeader()) &&
         "At least one edge out of the latch must go to the header");

  return Br;
}


/// Thin wrapper around a loop pointer, so that a dedicated stream operator
/// can be selected for it when printing debug output.
struct DbgLoop {
  /// The wrapped loop.
  const Loop *L;

  explicit DbgLoop(const Loop *TheLoop) : L(TheLoop) {}
};


#ifndef NDEBUG


/// Prints "function <name> <loop>" for the loop wrapped by \p D: the parent
/// function of the loop header is printed as an operand (without its type),
/// followed by the loop itself.
static inline raw_ostream &operator<<(raw_ostream &OS, DbgLoop D) {
  const Function *F = D.L->getHeader()->getParent();
  OS << "function ";
  F->printAsOperand(OS, /*PrintType=*/false);
  OS << " " << *D.L;
  return OS;
}


#endif // NDEBUG


/// Estimates the trip count of \p L from the branch weights attached to its
/// latch branch.  Returns std::nullopt when the latch branch does not have
/// the form required by getExpectedExitLoopLatchBranch, when no branch
/// weights can be extracted, or when the exit weight is zero.  The result
/// saturates at the maximum value of unsigned.
static std::optional<unsigned> estimateLoopTripCount(Loop *L) {
  // Only the latch exit is taken into account; other exiting blocks are
  // ignored.  This can overestimate the trip count if the loop is left
  // through another exit, but it can never underestimate it.
  // TODO: incorporate information from other exits
  BranchInst *LatchBr = getExpectedExitLoopLatchBranch(L);
  if (!LatchBr) {
    LLVM_DEBUG(dbgs() << "estimateLoopTripCount: Failed to find exiting "
                      << "latch branch of required form in " << DbgLoop(L)
                      << "\n");
    return std::nullopt;
  }

  // The ratio "backedge taken" vs. "loop exited" tells us how often the body
  // ran per loop invocation.
  uint64_t TrueWeight, FalseWeight;
  if (!extractBranchWeights(*LatchBr, TrueWeight, FalseWeight)) {
    LLVM_DEBUG(dbgs() << "estimateLoopTripCount: Failed to extract branch "
                      << "weights for " << DbgLoop(L) << "\n");
    return std::nullopt;
  }

  // Map the (true, false) weights onto (backedge, exit) depending on which
  // successor stays inside the loop.
  const bool BackedgeOnFalse = L->contains(LatchBr->getSuccessor(1));
  const uint64_t BackedgeWeight = BackedgeOnFalse ? FalseWeight : TrueWeight;
  const uint64_t ExitWeight = BackedgeOnFalse ? TrueWeight : FalseWeight;

  if (ExitWeight == 0) {
    // Don't have a way to return predicated infinite
    LLVM_DEBUG(dbgs() << "estimateLoopTripCount: Failed because of zero exit "
                      << "probability for " << DbgLoop(L) << "\n");
    return std::nullopt;
  }

  // Estimated exit count: backedge weight divided by exit weight, rounded to
  // nearest.
  const uint64_t ExitCount = llvm::divideNearest(BackedgeWeight, ExitWeight);

  // ExitCount + 1 would not fit into unsigned: saturate.
  constexpr unsigned MaxTripCount = std::numeric_limits<unsigned>::max();
  if (ExitCount >= MaxTripCount)
    return MaxTripCount;

  // The trip count is one more than the exit count.
  const uint64_t TC = ExitCount + 1;
  LLVM_DEBUG(dbgs() << "estimateLoopTripCount: Estimated trip count of " << TC
                    << " for " << DbgLoop(L) << "\n");
  return static_cast<unsigned>(TC);
}


/// Returns the estimated trip count of \p L, or std::nullopt if none can be
/// determined.  The LLVMLoopEstimatedTripCount loop attribute is preferred;
/// otherwise the count is estimated from the latch branch weights.  When
/// \p EstimatedLoopInvocationWeight is non-null, it additionally receives the
/// latch exit weight, and std::nullopt is returned if that weight cannot be
/// extracted or is zero.
std::optional<unsigned>
llvm::getLoopEstimatedTripCount(Loop *L,
                                unsigned *EstimatedLoopInvocationWeight) {
  // A loop is not supported if getExpectedExitLoopLatchBranch returns nullptr.
  // That is required when EstimatedLoopInvocationWeight is requested.
  //
  // FIXME: The check is also a stop-gap for nested loops.  It prevents
  // LLVMLoopEstimatedTripCount metadata that was created for an inner loop
  // from being mistaken for metadata of an outer loop.  Loop metadata lives on
  // the branch instruction of the latch block, and a latch can be shared
  // between loops.  Attaching loop metadata to loop headers instead would
  // solve this, but that would be a large change to LLVM.
  //
  // Until then the workaround is this: getExpectedExitLoopLatchBranch (which
  // also guards setLoopEstimatedTripCount) only accepts a loop with a single
  // latch that has exactly two successors, one of which exits the loop.  For
  // a latch shared by nested loops that can hold for the inner loop but never
  // for the outer loop:
  // - A shared latch has at least two successors: the inner loop header and
  //   the outer loop header, the latter being an exit of the inner loop.
  //   That satisfies the condition for the inner loop.
  // - To satisfy the condition for the outer loop, the latch would need a
  //   third successor that exits the outer loop, which violates the condition
  //   for both loops.
  BranchInst *LatchBr = getExpectedExitLoopLatchBranch(L);
  if (!LatchBr)
    return std::nullopt;

  // If requested, compute *EstimatedLoopInvocationWeight, or give up when
  // that is not possible.
  //
  // TODO: Eventually, once all passes have migrated away from setting branch
  // weights to indicate estimated trip counts, this function will drop the
  // EstimatedLoopInvocationWeight parameter.
  if (EstimatedLoopInvocationWeight) {
    uint64_t TrueWeight = 0, FalseWeight = 0; // Inits expected to be unused.
    if (!extractBranchWeights(*LatchBr, TrueWeight, FalseWeight))
      return std::nullopt;

    // The exit weight belongs to whichever successor leaves the loop.
    const uint64_t ExitWeight =
        L->contains(LatchBr->getSuccessor(1)) ? TrueWeight : FalseWeight;
    if (ExitWeight == 0)
      return std::nullopt;

    // NOTE(review): implicit uint64_t -> unsigned conversion; presumably the
    // weights always fit into 32 bits -- confirm.
    *EstimatedLoopInvocationWeight = ExitWeight;
  }

  // Prefer the trip count recorded in loop metadata, if present with a value.
  if (auto MetadataTC =
          getOptionalIntLoopAttribute(L, LLVMLoopEstimatedTripCount)) {
    LLVM_DEBUG(dbgs() << "getLoopEstimatedTripCount: "
                      << LLVMLoopEstimatedTripCount << " metadata has trip "
                      << "count of " << *MetadataTC << " for " << DbgLoop(L)
                      << "\n");
    return MetadataTC;
  }

  // Otherwise fall back to the latch branch weights.
  return estimateLoopTripCount(L);
}


/// Records \p EstimatedTripCount for \p L as LLVMLoopEstimatedTripCount loop
/// metadata.  If \p EstimatedloopInvocationWeight is provided, the latch
/// branch weights are rewritten as well so that they encode the same trip
/// count.  Returns false, without changing anything, when
/// getExpectedExitLoopLatchBranch rejects the loop; returns true otherwise.
bool llvm::setLoopEstimatedTripCount(
    Loop *L, unsigned EstimatedTripCount,
    std::optional<unsigned> EstimatedloopInvocationWeight) {
  // A loop is not supported if getExpectedExitLoopLatchBranch returns nullptr.
  //
  // FIXME: See comments in getLoopEstimatedTripCount for why this is required
  // here regardless of EstimatedLoopInvocationWeight.
  BranchInst *LatchBr = getExpectedExitLoopLatchBranch(L);
  if (!LatchBr)
    return false;

  // Record the trip count as loop metadata.
  addStringMetadataToLoop(L, LLVMLoopEstimatedTripCount, EstimatedTripCount);

  // Only the latch branch's weights can be updated at the moment.  The API
  // could be extended to handle estimated trip counts for any exit.
  //
  // TODO: Eventually, once all passes have migrated away from setting branch
  // weights to indicate estimated trip counts, we will not set branch weights
  // here at all.
  if (!EstimatedloopInvocationWeight)
    return true;

  // Derive the exit and backedge weights.  Both stay zero for a zero trip
  // count.
  // NOTE(review): the multiplication below is done in unsigned and wraps for
  // large operands -- confirm callers keep the product in range.
  const bool HasIterations = EstimatedTripCount != 0;
  const unsigned ExitWeight =
      HasIterations ? *EstimatedloopInvocationWeight : 0;
  const unsigned BackedgeWeight =
      HasIterations ? (EstimatedTripCount - 1) * ExitWeight : 0;

  // The first weight belongs to successor 0; place the backedge weight there
  // only if successor 0 is the header.
  const bool BackedgeOnTrue = LatchBr->getSuccessor(0) == L->getHeader();
  const unsigned TrueWeight = BackedgeOnTrue ? BackedgeWeight : ExitWeight;
  const unsigned FalseWeight = BackedgeOnTrue ? ExitWeight : BackedgeWeight;

  // Set/update the profile metadata on the latch branch.
  MDBuilder MDB(LatchBr->getContext());
  LatchBr->setMetadata(LLVMContext::MD_prof,
                       MDB.createBranchWeights(TrueWeight, FalseWeight));

  return true;
}


/// Returns true if \p InnerLoop has no parent loop, or if the exit count of
/// its latch is a computable integer-typed SCEV that is invariant in the
/// parent loop.  Returns false otherwise.
bool llvm::hasIterationCountInvariantInParent(Loop *InnerLoop,
                                              ScalarEvolution &SE) {
  Loop *ParentLoop = InnerLoop->getParentLoop();
  if (!ParentLoop)
    return true;

  // Exit count of the inner loop, taken at its latch.
  const SCEV *LatchExitCount =
      SE.getExitCount(InnerLoop, InnerLoop->getLoopLatch());
  if (isa<SCEVCouldNotCompute>(LatchExitCount) ||
      !LatchExitCount->getType()->isIntegerTy())
    return false;

  // The count must not vary across iterations of the parent loop.
  return SE.getLoopDisposition(LatchExitCount, ParentLoop) ==
         ScalarEvolution::LoopInvariant;
}


/// Maps the recurrence kind \p RK to the vector_reduce_* intrinsic used to
/// reduce a vector of that kind.  Kinds that are not listed hit
/// llvm_unreachable.
constexpr Intrinsic::ID llvm::getReductionIntrinsicID(RecurKind RK) {
  switch (RK) {
  // Integer arithmetic and bitwise kinds.
  case RecurKind::Add:
  case RecurKind::Sub:
  case RecurKind::AddChainWithSubs:
    return Intrinsic::vector_reduce_add;
  case RecurKind::Mul:
    return Intrinsic::vector_reduce_mul;
  case RecurKind::And:
    return Intrinsic::vector_reduce_and;
  case RecurKind::Or:
    return Intrinsic::vector_reduce_or;
  case RecurKind::Xor:
    return Intrinsic::vector_reduce_xor;

  // Floating-point arithmetic kinds.
  case RecurKind::FAdd:
  case RecurKind::FMulAdd:
    return Intrinsic::vector_reduce_fadd;
  case RecurKind::FMul:
    return Intrinsic::vector_reduce_fmul;

  // Integer min/max kinds.
  case RecurKind::SMax:
    return Intrinsic::vector_reduce_smax;
  case RecurKind::SMin:
    return Intrinsic::vector_reduce_smin;
  case RecurKind::UMax:
    return Intrinsic::vector_reduce_umax;
  case RecurKind::UMin:
    return Intrinsic::vector_reduce_umin;

  // Floating-point min/max kinds.  The *Num variants share the fmax/fmin
  // reduction intrinsics.
  case RecurKind::FMax:
  case RecurKind::FMaxNum:
  case RecurKind::FMaximumNum:
    return Intrinsic::vector_reduce_fmax;
  case RecurKind::FMin:
  case RecurKind::FMinNum:
  case RecurKind::FMinimumNum:
    return Intrinsic::vector_reduce_fmin;
  case RecurKind::FMaximum:
    return Intrinsic::vector_reduce_fmaximum;
  case RecurKind::FMinimum:
    return Intrinsic::vector_reduce_fminimum;

  default:
    llvm_unreachable("Unexpected recurrence kind");
  }
}


/// Maps a scalar integer min/max intrinsic \p IID (smin, smax, umin, umax) to
/// the matching vector_reduce_* intrinsic.  Any other ID hits
/// llvm_unreachable.
Intrinsic::ID llvm::getMinMaxReductionIntrinsicID(Intrinsic::ID IID) {
  switch (IID) {
  case Intrinsic::smax:
    return Intrinsic::vector_reduce_smax;
  case Intrinsic::smin:
    return Intrinsic::vector_reduce_smin;
  case Intrinsic::umax:
    return Intrinsic::vector_reduce_umax;
  case Intrinsic::umin:
    return Intrinsic::vector_reduce_umin;
  default:
    llvm_unreachable("Unexpected intrinsic id");
  }
}


// Inverse of getReductionForBinop: maps the reduction intrinsic \p RdxID to
// the opcode of its scalar operation.  Integer min/max reductions map to ICmp
// and fmax/fmin reductions to FCmp.  Any other ID hits llvm_unreachable.
unsigned llvm::getArithmeticReductionInstruction(Intrinsic::ID RdxID) {
  switch (RdxID) {
  // Integer arithmetic and bitwise reductions.
  case Intrinsic::vector_reduce_add:
    return Instruction::Add;
  case Intrinsic::vector_reduce_mul:
    return Instruction::Mul;
  case Intrinsic::vector_reduce_and:
    return Instruction::And;
  case Intrinsic::vector_reduce_or:
    return Instruction::Or;
  case Intrinsic::vector_reduce_xor:
    return Instruction::Xor;

  // Floating-point arithmetic reductions.
  case Intrinsic::vector_reduce_fadd:
    return Instruction::FAdd;
  case Intrinsic::vector_reduce_fmul:
    return Instruction::FMul;

  // Min/max reductions are represented by their compare opcode.
  case Intrinsic::vector_reduce_umin:
  case Intrinsic::vector_reduce_umax:
  case Intrinsic::vector_reduce_smin:
  case Intrinsic::vector_reduce_smax:
    return Instruction::ICmp;
  case Intrinsic::vector_reduce_fmin:
  case Intrinsic::vector_reduce_fmax:
    return Instruction::FCmp;

  default:
    llvm_unreachable("Unexpected ID");
  }
}


// Inverse of getArithmeticReductionInstruction for integer binary operators:
// maps \p Opc to its vector_reduce_* intrinsic, or to
// Intrinsic::not_intrinsic when the opcode is not one of the listed ones.
Intrinsic::ID llvm::getReductionForBinop(Instruction::BinaryOps Opc) {
  switch (Opc) {
  case Instruction::Add:
    return Intrinsic::vector_reduce_add;
  case Instruction::Mul:
    return Intrinsic::vector_reduce_mul;
  case Instruction::And:
    return Intrinsic::vector_reduce_and;
  case Instruction::Or:
    return Intrinsic::vector_reduce_or;
  case Instruction::Xor:
    return Intrinsic::vector_reduce_xor;
  default:
    return Intrinsic::not_intrinsic;
  }
}


/// Maps a min/max vector reduction intrinsic \p RdxID to the scalar min/max
/// intrinsic that combines two values of that reduction.  Any other ID hits
/// llvm_unreachable.
Intrinsic::ID llvm::getMinMaxReductionIntrinsicOp(Intrinsic::ID RdxID) {
  switch (RdxID) {
  // Integer reductions.
  case Intrinsic::vector_reduce_smax:
    return Intrinsic::smax;
  case Intrinsic::vector_reduce_smin:
    return Intrinsic::smin;
  case Intrinsic::vector_reduce_umax:
    return Intrinsic::umax;
  case Intrinsic::vector_reduce_umin:
    return Intrinsic::umin;

  // Floating-point reductions.
  case Intrinsic::vector_reduce_fmax:
    return Intrinsic::maxnum;
  case Intrinsic::vector_reduce_fmin:
    return Intrinsic::minnum;
  case Intrinsic::vector_reduce_fmaximum:
    return Intrinsic::maximum;
  case Intrinsic::vector_reduce_fminimum:
    return Intrinsic::minimum;

  default:
    llvm_unreachable("Unknown min/max recurrence kind");
  }
}


/// Maps a min/max recurrence kind \p RK to the scalar min/max intrinsic that
/// combines two values of that kind.  Any other kind hits llvm_unreachable.
Intrinsic::ID llvm::getMinMaxReductionIntrinsicOp(RecurKind RK) {
  switch (RK) {
  // Integer kinds.
  case RecurKind::SMax:
    return Intrinsic::smax;
  case RecurKind::SMin:
    return Intrinsic::smin;
  case RecurKind::UMax:
    return Intrinsic::umax;
  case RecurKind::UMin:
    return Intrinsic::umin;

  // Floating-point kinds.
  case RecurKind::FMax:
  case RecurKind::FMaxNum:
    return Intrinsic::maxnum;
  case RecurKind::FMin:
  case RecurKind::FMinNum:
    return Intrinsic::minnum;
  case RecurKind::FMaximum:
    return Intrinsic::maximum;
  case RecurKind::FMinimum:
    return Intrinsic::minimum;
  case RecurKind::FMaximumNum:
    return Intrinsic::maximumnum;
  case RecurKind::FMinimumNum:
    return Intrinsic::minimumnum;

  default:
    llvm_unreachable("Unknown min/max recurrence kind");
  }
}


/// Maps a min/max vector reduction intrinsic \p RdxID to its recurrence kind.
/// Returns RecurKind::None for every ID that is not listed below.
RecurKind llvm::getMinMaxReductionRecurKind(Intrinsic::ID RdxID) {
  switch (RdxID) {
  case Intrinsic::vector_reduce_umin:
    return RecurKind::UMin;
  case Intrinsic::vector_reduce_umax:
    return RecurKind::UMax;
  case Intrinsic::vector_reduce_smin:
    return RecurKind::SMin;
  case Intrinsic::vector_reduce_smax:
    return RecurKind::SMax;
  case Intrinsic::vector_reduce_fmin:
    return RecurKind::FMin;
  case Intrinsic::vector_reduce_fmax:
    return RecurKind::FMax;
  default:
    return RecurKind::None;
  }
}


/// Returns the compare predicate that selects the left operand of a min/max
/// recurrence of kind \p RK.  Kinds that are not listed hit llvm_unreachable.
CmpInst::Predicate llvm::getMinMaxReductionPredicate(RecurKind RK) {
  switch (RK) {
  case RecurKind::SMax:
    return CmpInst::ICMP_SGT;
  case RecurKind::SMin:
    return CmpInst::ICMP_SLT;
  case RecurKind::UMax:
    return CmpInst::ICMP_UGT;
  case RecurKind::UMin:
    return CmpInst::ICMP_ULT;
  case RecurKind::FMax:
    return CmpInst::FCMP_OGT;
  case RecurKind::FMin:
    return CmpInst::FCMP_OLT;
  // FMinimum/FMaximum are deliberately absent: no predicate compares signed
  // zeroes the way the llvm.minimum/maximum intrinsics require.
  default:
    llvm_unreachable("Unknown min/max recurrence kind");
  }
}


/// Emits the min/max of \p Left and \p Right for recurrence kind \p RK.
/// Integer (or integer-vector) operands and the FMinNum/FMaxNum,
/// FMinimum/FMaximum and FMinimumNum/FMaximumNum kinds use the matching
/// min/max intrinsic; everything else is emitted as a compare followed by a
/// select.
Value *llvm::createMinMaxOp(IRBuilderBase &Builder, RecurKind RK, Value *Left,
                            Value *Right) {
  Type *Ty = Left->getType();

  // FP kinds that are lowered to an intrinsic.
  const bool IsIntrinsicFPKind =
      RK == RecurKind::FMinNum || RK == RecurKind::FMaxNum ||
      RK == RecurKind::FMinimum || RK == RecurKind::FMaximum ||
      RK == RecurKind::FMinimumNum || RK == RecurKind::FMaximumNum;

  if (!Ty->isIntOrIntVectorTy() && !IsIntrinsicFPKind) {
    // Compare + select form.
    Value *Cmp = Builder.CreateCmp(getMinMaxReductionPredicate(RK), Left,
                                   Right, "rdx.minmax.cmp");
    return Builder.CreateSelect(Cmp, Left, Right, "rdx.minmax.select");
  }

  // Intrinsic form.
  return Builder.CreateIntrinsic(Ty, getMinMaxReductionIntrinsicOp(RK),
                                 {Left, Right}, nullptr, "rdx.minmax");
}


// Emits an in-order scalar reduction of the fixed-width vector \p Src,
// starting from \p Acc.  Elements are extracted and combined from lane 0
// upwards.  \p Op is the scalar opcode; for ICmp/FCmp the combine step is a
// min/max of kind \p RdxKind.
Value *llvm::getOrderedReduction(IRBuilderBase &Builder, Value *Acc, Value *Src,
                                 unsigned Op, RecurKind RdxKind) {
  const unsigned NumElts =
      cast<FixedVectorType>(Src->getType())->getNumElements();
  const bool IsBinOp = Op != Instruction::ICmp && Op != Instruction::FCmp;

  // Builds ((((Acc op Src[0]) op Src[1]) op Src[2]) ...) op Src[NumElts-1].
  Value *Running = Acc;
  for (unsigned Lane = 0; Lane != NumElts; ++Lane) {
    Value *Elt = Builder.CreateExtractElement(Src, Builder.getInt32(Lane));

    if (IsBinOp) {
      Running = Builder.CreateBinOp(static_cast<Instruction::BinaryOps>(Op),
                                    Running, Elt, "bin.rdx");
      continue;
    }

    assert(RecurrenceDescriptor::isMinMaxRecurrenceKind(RdxKind) &&
           "Invalid min/max");
    Running = createMinMaxOp(Builder, RdxKind, Running, Elt);
  }

  return Running;
}


// Emits a reduction of the fixed-width vector \p Src as rounds of
// "shuffle, then combine with the previous value" and returns element 0 of
// the final vector.  \p RS selects between the pairwise mask layout and the
// "upper half onto lower half" layout.  \p Op is the scalar opcode; for
// ICmp/FCmp the combine step is a min/max of kind \p RdxKind.
Value *llvm::getShuffleReduction(IRBuilderBase &Builder, Value *Src,
                                 unsigned Op,
                                 TargetTransformInfo::ReductionShuffle RS,
                                 RecurKind RdxKind) {
  const unsigned NumElts =
      cast<FixedVectorType>(Src->getType())->getNumElements();
  // The element count is a power of two, so the reduction takes log2(NumElts)
  // shuffle + op rounds, each halving the set of values being computed.
  assert(isPowerOf2_32(NumElts) &&
         "Reduction emission only supported for pow2 vectors!");

  // Note: fast-math flags are controlled by the builder configuration and are
  // assumed to apply to all generated arithmetic instructions.  Other poison
  // generating flags (nsw/nuw/inbounds/inrange/exact) are not part of the
  // builder configuration, and since they are not passed explicitly, they are
  // never relevant here.  Propagating them from an intrinsic call to the
  // expansion would be generally unsound anyway, because the order of
  // operations changes.
  const bool IsBinOp = Op != Instruction::ICmp && Op != Instruction::FCmp;
  Value *Partial = Src;

  // Shuffles Partial with Mask and folds the shuffled vector into Partial.
  auto ShuffleAndCombine = [&](SmallVectorImpl<int> &Mask) {
    Value *Shuffled = Builder.CreateShuffleVector(Partial, Mask, "rdx.shuf");
    if (IsBinOp) {
      Partial = Builder.CreateBinOp(static_cast<Instruction::BinaryOps>(Op),
                                    Partial, Shuffled, "bin.rdx");
      return;
    }
    assert(RecurrenceDescriptor::isMinMaxRecurrenceKind(RdxKind) &&
           "Invalid min/max");
    Partial = createMinMaxOp(Builder, RdxKind, Partial, Shuffled);
  };

  SmallVector<int, 32> Mask(NumElts);
  if (RS == TargetTransformInfo::ReductionShuffle::Pairwise) {
    for (unsigned Stride = 1; Stride < NumElts; Stride <<= 1) {
      // Start from an all-undef mask, then make every lane that is a multiple
      // of 2 * Stride read the lane Stride positions above it.
      Mask.assign(NumElts, -1);
      for (unsigned Lane = 0; Lane < NumElts; Lane += Stride << 1)
        Mask[Lane] = Lane + Stride;
      ShuffleAndCombine(Mask);
    }
  } else {
    for (unsigned Width = NumElts; Width != 1; Width >>= 1) {
      const unsigned Half = Width / 2;
      // Move the upper half of the live lanes onto the lower half.
      for (unsigned Lane = 0; Lane != Half; ++Lane)
        Mask[Lane] = Half + Lane;

      // Everything above the lower half is undef.
      std::fill(Mask.begin() + Half, Mask.end(), -1);
      ShuffleAndCombine(Mask);
    }
  }

  // The reduced value ends up in lane 0.
  return Builder.CreateExtractElement(Partial, Builder.getInt32(0));
}


/// Emits the final value of an any-of reduction: the non-phi operand of the
/// select that uses \p OrigPhi if any lane of \p Src is true, and \p InitVal
/// otherwise.  A vector \p Src is or-reduced first; the condition is frozen
/// before it is used.
Value *llvm::createAnyOfReduction(IRBuilderBase &Builder, Value *Src,
                                  Value *InitVal, PHINode *OrigPhi) {
  // Locate the first select among the users of the original phi; it tells us
  // which new value the loop selects.
  SelectInst *Sel = nullptr;
  for (User *U : OrigPhi->users()) {
    Sel = dyn_cast<SelectInst>(U);
    if (Sel)
      break;
  }
  assert(Sel && "One user of the original phi should be a select");

  // The new value is whichever select operand is not the phi.
  const bool PhiIsTrueValue = Sel->getTrueValue() == OrigPhi;
  assert((PhiIsTrueValue || Sel->getFalseValue() == OrigPhi) &&
         "At least one input to the select should be the original Phi");
  Value *NewVal = PhiIsTrueValue ? Sel->getFalseValue() : Sel->getTrueValue();

  // Any true predicate means the new value is selected.
  Value *AnyOf = Src;
  if (Src->getType()->isVectorTy())
    AnyOf = Builder.CreateOrReduce(Src);

  // The compares in the loop may yield poison, which propagates through the
  // bitwise ORs.  Freeze the condition before it is used.
  AnyOf = Builder.CreateFreeze(AnyOf);
  return Builder.CreateSelect(AnyOf, NewVal, InitVal, "rdx.select");
}


/// Emits the final value of a find-IV reduction.  A vector \p Src is reduced
/// with an integer max reduce when \p RdxKind is a FindLastIV kind and with
/// an integer min reduce otherwise; a scalar \p Src is used as is.  The
/// result is \p Start if the reduced value equals \p Sentinel, and the
/// reduced value otherwise.
Value *llvm::createFindLastIVReduction(IRBuilderBase &Builder, Value *Src,
                                       RecurKind RdxKind, Value *Start,
                                       Value *Sentinel) {
  const bool IsSigned = RecurrenceDescriptor::isSignedRecurrenceKind(RdxKind);
  const bool UseMaxReduce =
      RecurrenceDescriptor::isFindLastIVRecurrenceKind(RdxKind);

  Value *Reduced = Src;
  if (Src->getType()->isVectorTy())
    Reduced = UseMaxReduce ? Builder.CreateIntMaxReduce(Src, IsSigned)
                           : Builder.CreateIntMinReduce(Src, IsSigned);

  // A reduced value equal to the sentinel is corrected back to the start
  // value.
  Value *IsNotSentinel = Builder.CreateCmp(CmpInst::ICMP_NE, Reduced, Sentinel,
                                           "rdx.select.cmp");
  return Builder.CreateSelect(IsNotSentinel, Reduced, Start, "rdx.select");
}


/// Returns the identity (neutral) value of type \p Ty for the reduction
/// intrinsic \p RdxID, taking the fast-math flags \p Flags into account for
/// floating-point reductions.  Any other ID hits llvm_unreachable.
Value *llvm::getReductionIdentity(Intrinsic::ID RdxID, Type *Ty,
                                  FastMathFlags Flags) {
  switch (RdxID) {
  // Arithmetic and bitwise reductions: identity of the scalar binary operator.
  case Intrinsic::vector_reduce_add:
  case Intrinsic::vector_reduce_mul:
  case Intrinsic::vector_reduce_and:
  case Intrinsic::vector_reduce_or:
  case Intrinsic::vector_reduce_xor:
  case Intrinsic::vector_reduce_fadd:
  case Intrinsic::vector_reduce_fmul:
    return ConstantExpr::getBinOpIdentity(
        getArithmeticReductionInstruction(RdxID), Ty, false,
        Flags.noSignedZeros());

  // Integer min/max reductions: identity of the scalar min/max intrinsic.
  case Intrinsic::vector_reduce_smax:
  case Intrinsic::vector_reduce_smin:
  case Intrinsic::vector_reduce_umax:
  case Intrinsic::vector_reduce_umin:
    return ConstantExpr::getIntrinsicIdentity(
        getMinMaxReductionIntrinsicOp(RdxID), Ty);

  // Floating-point min/max reductions.
  case Intrinsic::vector_reduce_fmax:
  case Intrinsic::vector_reduce_fmaximum:
  case Intrinsic::vector_reduce_fmin:
  case Intrinsic::vector_reduce_fminimum: {
    // The max flavours use the negative constant, the min flavours the
    // positive one.
    const bool Negative = RdxID == Intrinsic::vector_reduce_fmax ||
                          RdxID == Intrinsic::vector_reduce_fmaximum;
    const bool PropagatesNaN = RdxID == Intrinsic::vector_reduce_fminimum ||
                               RdxID == Intrinsic::vector_reduce_fmaximum;
    const fltSemantics &Semantics = Ty->getFltSemantics();

    // Pick a quiet NaN when NaNs are allowed and the reduction does not
    // propagate them, else an infinity when infinities are allowed, else the
    // largest-magnitude finite value.
    if (!Flags.noNaNs() && !PropagatesNaN)
      return ConstantFP::getQNaN(Ty, Negative);
    if (!Flags.noInfs())
      return ConstantFP::getInfinity(Ty, Negative);
    return ConstantFP::get(Ty, APFloat::getLargest(Semantics, Negative));
  }

  default:
    llvm_unreachable("Expecting a reduction intrinsic");
  }
}


/// Returns the identity value of type \p Tp for recurrence kind \p K by
/// delegating to getReductionIdentity with the matching reduction intrinsic.
/// FMin/FMax recurrences require nnan and nsz to be set in \p FMF.
Value *llvm::getRecurrenceIdentity(RecurKind K, Type *Tp, FastMathFlags FMF) {
  assert(((K != RecurKind::FMin && K != RecurKind::FMax) ||
          (FMF.noNaNs() && FMF.noSignedZeros())) &&
         "nnan, nsz is expected to be set for FP min/max reduction.");
  return getReductionIdentity(getReductionIntrinsicID(K), Tp, FMF);
}


/// Emits a vector reduction of \p Src for recurrence kind \p RdxKind.  FAdd,
/// FMulAdd and FMul reductions are seeded with the recurrence identity; the
/// other supported kinds are emitted as a unary reduction intrinsic call.
/// Unsupported kinds hit llvm_unreachable.
Value *llvm::createSimpleReduction(IRBuilderBase &Builder, Value *Src,
                                   RecurKind RdxKind) {
  Type *EltTy = cast<VectorType>(Src->getType())->getElementType();

  switch (RdxKind) {
  // Floating-point add/mul reductions take an explicit start value.
  case RecurKind::FAdd:
  case RecurKind::FMulAdd:
    return Builder.CreateFAddReduce(
        getRecurrenceIdentity(RdxKind, EltTy, Builder.getFastMathFlags()),
        Src);
  case RecurKind::FMul:
    return Builder.CreateFMulReduce(
        getRecurrenceIdentity(RdxKind, EltTy, Builder.getFastMathFlags()),
        Src);

  // Everything else is a plain unary reduction intrinsic.
  case RecurKind::Add:
  case RecurKind::Sub:
  case RecurKind::AddChainWithSubs:
  case RecurKind::Mul:
  case RecurKind::And:
  case RecurKind::Or:
  case RecurKind::Xor:
  case RecurKind::SMin:
  case RecurKind::SMax:
  case RecurKind::UMin:
  case RecurKind::UMax:
  case RecurKind::FMin:
  case RecurKind::FMax:
  case RecurKind::FMinNum:
  case RecurKind::FMaxNum:
  case RecurKind::FMinimum:
  case RecurKind::FMaximum:
  case RecurKind::FMinimumNum:
  case RecurKind::FMaximumNum:
    return Builder.CreateUnaryIntrinsic(getReductionIntrinsicID(RdxKind), Src);

  default:
    llvm_unreachable("Unhandled opcode");
  }
}


/// Emits a vector-predicated reduction of \p Src for recurrence kind \p Kind.
/// The VP intrinsic is called with the recurrence identity as start value,
/// followed by \p Src, \p Mask and \p EVL.  AnyOf and FindIV kinds are not
/// supported.
Value *llvm::createSimpleReduction(IRBuilderBase &Builder, Value *Src,
                                   RecurKind Kind, Value *Mask, Value *EVL) {
  assert(!RecurrenceDescriptor::isAnyOfRecurrenceKind(Kind) &&
         !RecurrenceDescriptor::isFindIVRecurrenceKind(Kind) &&
         "AnyOf and FindIV reductions are not supported.");

  // Translate the kind into its reduction intrinsic, then into the VP form.
  auto VPID = VPIntrinsic::getForIntrinsic(getReductionIntrinsicID(Kind));
  assert(VPReductionIntrinsic::isVPReduction(VPID) &&
         "No VPIntrinsic for this reduction");

  Type *ScalarTy = cast<VectorType>(Src->getType())->getElementType();
  Value *Identity =
      getRecurrenceIdentity(Kind, ScalarTy, Builder.getFastMathFlags());
  Value *Args[] = {Identity, Src, Mask, EVL};
  return Builder.CreateIntrinsic(ScalarTy, VPID, Args);
}


/// Emits an fadd reduction of the vector \p Src seeded with the scalar
/// \p Start.  Only FAdd and FMulAdd recurrence kinds are accepted.
Value *llvm::createOrderedReduction(IRBuilderBase &B, RecurKind Kind,
                                    Value *Src, Value *Start) {
  // Validate the kind and the operand shapes.
  assert((Kind == RecurKind::FAdd || Kind == RecurKind::FMulAdd) &&
         "Unexpected reduction kind");
  assert(Src->getType()->isVectorTy() && "Expected a vector type");
  assert(!Start->getType()->isVectorTy() && "Expected a scalar type");

  Value *Reduced = B.CreateFAddReduce(Start, Src);
  return Reduced;
}


/// Vector-predicated variant: emits the VP form of the fadd reduction of the
/// vector \p Src seeded with the scalar \p Start, passing \p Mask and \p EVL
/// through.  Only FAdd and FMulAdd recurrence kinds are accepted.
Value *llvm::createOrderedReduction(IRBuilderBase &Builder, RecurKind Kind,
                                    Value *Src, Value *Start, Value *Mask,
                                    Value *EVL) {
  // Validate the kind and the operand shapes.
  assert((Kind == RecurKind::FAdd || Kind == RecurKind::FMulAdd) &&
         "Unexpected reduction kind");
  assert(Src->getType()->isVectorTy() && "Expected a vector type");
  assert(!Start->getType()->isVectorTy() && "Expected a scalar type");

  // Both accepted kinds are emitted as the VP form of the FAdd reduction.
  auto VPID =
      VPIntrinsic::getForIntrinsic(getReductionIntrinsicID(RecurKind::FAdd));
  assert(VPReductionIntrinsic::isVPReduction(VPID) &&
         "No VPIntrinsic for this reduction");

  Type *ScalarTy = cast<VectorType>(Src->getType())->getElementType();
  Value *Args[] = {Start, Src, Mask, EVL};
  return Builder.CreateIntrinsic(ScalarTy, VPID, Args);
}


/// Copies IR flags onto \p I (if it is an instruction) from \p OpValue, or
/// from the first element of \p VL when \p OpValue is null, and then
/// intersects them with the flags of the instructions in \p VL.  When
/// \p OpValue is given, only instructions with the same opcode take part in
/// the intersection.  \p IncludeWrapFlags is forwarded to copyIRFlags.
void llvm::propagateIRFlags(Value *I, ArrayRef<Value *> VL, Value *OpValue,
                            bool IncludeWrapFlags) {
  auto *Target = dyn_cast<Instruction>(I);
  if (!Target)
    return;

  // Instruction that seeds the flag set.
  auto *Seed = dyn_cast<Instruction>(OpValue ? OpValue : VL[0]);
  if (!Seed)
    return;

  const unsigned SeedOpcode = Seed->getOpcode();
  Target->copyIRFlags(Seed, IncludeWrapFlags);

  // Narrow the flags down to what all participating instructions agree on.
  for (Value *V : VL) {
    auto *Inst = dyn_cast<Instruction>(V);
    if (Inst && (!OpValue || Inst->getOpcode() == SeedOpcode))
      Target->andIRFlags(V);
  }
}


bool llvm::isKnownNegativeInLoop(const SCEV *S, const Loop *L,

                                 ScalarEvolution &SE) {

  const SCEV *Zero = SE.getZero(S->getType());

  return SE.isAvailableAtLoopEntry(S, L) &&

         SE.isLoopEntryGuardedByCond(L, ICmpInst::ICMP_SLT, S, Zero);

}


bool llvm::isKnownNonNegativeInLoop(const SCEV *S, const Loop *L,

                                    ScalarEvolution &SE) {

  const SCEV *Zero = SE.getZero(S->getType());

  return SE.isAvailableAtLoopEntry(S, L) &&

         SE.isLoopEntryGuardedByCond(L, ICmpInst::ICMP_SGE, S, Zero);

}


bool llvm::isKnownPositiveInLoop(const SCEV *S, const Loop *L,

                                 ScalarEvolution &SE) {

  const SCEV *Zero = SE.getZero(S->getType());

  return SE.isAvailableAtLoopEntry(S, L) &&

         SE.isLoopEntryGuardedByCond(L, ICmpInst::ICMP_SGT, S, Zero);

}


bool llvm::isKnownNonPositiveInLoop(const SCEV *S, const Loop *L,

                                    ScalarEvolution &SE) {

  const SCEV *Zero = SE.getZero(S->getType());

  return SE.isAvailableAtLoopEntry(S, L) &&

         SE.isLoopEntryGuardedByCond(L, ICmpInst::ICMP_SLE, S, Zero);

}


bool llvm::cannotBeMinInLoop(const SCEV *S, const Loop *L, ScalarEvolution &SE,

                             bool Signed) {

  unsigned BitWidth = cast<IntegerType>(S->getType())->getBitWidth();

  APInt Min = Signed ? APInt::getSignedMinValue(BitWidth) :

    APInt::getMinValue(BitWidth);

  auto Predicate = Signed ? ICmpInst::ICMP_SGT : ICmpInst::ICMP_UGT;

  return SE.isAvailableAtLoopEntry(S, L) &&

         SE.isLoopEntryGuardedByCond(L, Predicate, S,

                                     SE.getConstant(Min));

}


bool llvm::cannotBeMaxInLoop(const SCEV *S, const Loop *L, ScalarEvolution &SE,

                             bool Signed) {

  unsigned BitWidth = cast<IntegerType>(S->getType())->getBitWidth();

  APInt Max = Signed ? APInt::getSignedMaxValue(BitWidth) :

    APInt::getMaxValue(BitWidth);

  auto Predicate = Signed ? ICmpInst::ICMP_SLT : ICmpInst::ICMP_ULT;

  return SE.isAvailableAtLoopEntry(S, L) &&

         SE.isLoopEntryGuardedByCond(L, Predicate, S,

                                     SE.getConstant(Max));

}


//===----------------------------------------------------------------------===//

// rewriteLoopExitValues - Optimize IV users outside the loop.

// As a side effect, reduces the amount of IV processing within the loop.

//===----------------------------------------------------------------------===//


static bool hasHardUserWithinLoop(const Loop *L, const Instruction *I) {

  SmallPtrSet<const Instruction *, 8> Visited;

  SmallVector<const Instruction *, 8> WorkList;

  Visited.insert(I);

  WorkList.push_back(I);

  while (!WorkList.empty()) {

    const Instruction *Curr = WorkList.pop_back_val();

    // This use is outside the loop, nothing to do.

    if (!L->contains(Curr))

      continue;

    // Do we assume it is a "hard" use which will not be eliminated easily?

    if (Curr->mayHaveSideEffects())

      return true;

    // Otherwise, add all its users to worklist.

    for (const auto *U : Curr->users()) {

      auto *UI = cast<Instruction>(U);

      if (Visited.insert(UI).second)

        WorkList.push_back(UI);

    }

  }

  return false;

}


// Record describing one PHI operand that can be transformed in
// rewriteLoopExitValues.
struct RewritePhi {
  PHINode *PN;                 // PHI node the replacement applies to.
  unsigned Ith;                // Index of the incoming value within PN.
  const SCEV *ExpansionSCEV;   // SCEV of the incoming value being rewritten.
  Instruction *ExpansionPoint; // Where that SCEV should be expanded.
  bool HighCost;               // Whether the expansion is high-cost.

  RewritePhi(PHINode *Phi, unsigned Idx, const SCEV *S, Instruction *InsertPt,
             bool IsHighCost)
      : PN(Phi), Ith(Idx), ExpansionSCEV(S), ExpansionPoint(InsertPt),
        HighCost(IsHighCost) {}
};


// Checks whether the loop can be deleted once its exit values have been
// rewritten.  If so, ReplaceExitValue is ignored and the rewrite is done
// aggressively.  Requires a preheader, exactly one exiting block, exactly one
// unique exit block, no instruction with side effects inside the loop, and
// exit PHI inputs that are either scheduled for rewriting or (if they are
// instructions) have loop-invariant operands.
static bool canLoopBeDeleted(Loop *L, SmallVector<RewritePhi, 8> &RewritePhiSet) {
  // Without a preheader the loop will not be deleted.
  if (!L->getLoopPreheader())
    return false;

  // The LoopDeletion pass can delete loops with more than one exiting block.
  // Multiple exiting blocks are not handled here for simplicity.
  // TODO: If we see testcase with multiple ExitingBlocks can be deleted
  // after exit value rewriting, we can enhance the logic here.
  SmallVector<BasicBlock *, 4> ExitingBlocks;
  L->getExitingBlocks(ExitingBlocks);
  SmallVector<BasicBlock *, 8> ExitBlocks;
  L->getUniqueExitBlocks(ExitBlocks);
  if (ExitBlocks.size() != 1 || ExitingBlocks.size() != 1)
    return false;

  BasicBlock *TheExitingBlock = ExitingBlocks[0];
  for (PHINode &ExitPhi : ExitBlocks[0]->phis()) {
    Value *Incoming = ExitPhi.getIncomingValueForBlock(TheExitingBlock);

    // An incoming value listed in RewritePhiSet will be rewritten to a loop
    // invariant value later on, so it is exempt from the invariance check.
    const bool WillBeRewritten =
        llvm::any_of(RewritePhiSet, [&](const RewritePhi &RP) {
          return RP.PN == &ExitPhi &&
                 RP.PN->getIncomingValue(RP.Ith) == Incoming;
        });
    if (WillBeRewritten)
      continue;

    if (auto *IncomingInst = dyn_cast<Instruction>(Incoming))
      if (!L->hasLoopInvariantOperands(IncomingInst))
        return false;
  }

  // No instruction inside the loop may have side effects.
  for (BasicBlock *BB : L->blocks())
    for (Instruction &Inst : *BB)
      if (Inst.mayHaveSideEffects())
        return false;

  return true;
}


/// Guarded wrapper around InductionDescriptor::isInductionPHI.
///
/// The query is only forwarded when \p Phi is non-null, \p L has a preheader
/// and \p Phi lives in the header of \p L; otherwise false is returned without
/// touching \p ID. When isInductionPHI returns true, \p ID will also be set by
/// isInductionPHI.
static bool checkIsIndPhi(PHINode *Phi, Loop *L, ScalarEvolution *SE,
                          InductionDescriptor &ID) {
  const bool SafeToQuery =
      Phi && L->getLoopPreheader() && Phi->getParent() == L->getHeader();
  return SafeToQuery && InductionDescriptor::isInductionPHI(Phi, L, SE, ID);
}


/// Replace operands of the LCSSA PHI nodes in the exit blocks of \p L that are
/// defined inside the loop with a loop-invariant value computed from their
/// SCEV exit value.
///
/// The work is split in two phases. The first phase scans every PHI operand of
/// every unique exit block, filters the candidates according to
/// \p ReplaceExitValue, computes the exit-value SCEV and its expansion cost,
/// and records the candidate in a RewritePhi list; no code is expanded in this
/// phase. The second phase expands each recorded SCEV with \p Rewriter and
/// installs the result as the new PHI operand, skipping high-cost candidates
/// for the OnlyCheapRepl and UnusedIndVarInLoop strategies unless
/// canLoopBeDeleted reports that the loop could be deleted afterwards.
///
/// \param DeadInsts receives the former operand instructions that are
///        trivially dead after the replacement; they are not erased here.
/// \returns the number of PHI operands that were replaced.
int llvm::rewriteLoopExitValues(Loop *L, LoopInfo *LI, TargetLibraryInfo *TLI,
                                ScalarEvolution *SE,
                                const TargetTransformInfo *TTI,
                                SCEVExpander &Rewriter, DominatorTree *DT,
                                ReplaceExitVal ReplaceExitValue,
                                SmallVector<WeakTrackingVH, 16> &DeadInsts) {
  // Check a pre-condition.
  assert(L->isRecursivelyLCSSAForm(*DT, *LI) &&
         "Indvars did not preserve LCSSA!");

  SmallVector<BasicBlock*, 8> ExitBlocks;
  L->getUniqueExitBlocks(ExitBlocks);

  SmallVector<RewritePhi, 8> RewritePhiSet;
  // Find all values that are computed inside the loop, but used outside of it.
  // Because of LCSSA, these values will only occur in LCSSA PHI Nodes.  Scan
  // the exit blocks of the loop to find them.
  for (BasicBlock *ExitBB : ExitBlocks) {
    // If there are no PHI nodes in this exit block, then no values defined
    // inside the loop are used on this path, skip it.
    PHINode *PN = dyn_cast<PHINode>(ExitBB->begin());
    if (!PN) continue;

    // The operand count is read once from the first PHI and reused for every
    // PHI of this exit block.
    unsigned NumPreds = PN->getNumIncomingValues();

    // Iterate over all of the PHI nodes.
    BasicBlock::iterator BBI = ExitBB->begin();
    while ((PN = dyn_cast<PHINode>(BBI++))) {
      if (PN->use_empty())
        continue; // dead use, don't replace it

      if (!SE->isSCEVable(PN->getType()))
        continue;

      // Iterate over all of the values in all the PHI nodes.
      for (unsigned i = 0; i != NumPreds; ++i) {
        // If the value being merged in is not integer or is not defined
        // in the loop, skip it.
        Value *InVal = PN->getIncomingValue(i);
        if (!isa<Instruction>(InVal))
          continue;

        // If this pred is for a subloop, not L itself, skip it.
        if (LI->getLoopFor(PN->getIncomingBlock(i)) != L)
          continue; // The Block is in a subloop, skip it.

        // Check that InVal is defined in the loop.
        Instruction *Inst = cast<Instruction>(InVal);
        if (!L->contains(Inst))
          continue;

        // Find exit values which are induction variables in the loop, and are
        // unused in the loop, with the only use being the exit block PhiNode,
        // and the induction variable update binary operator.
        // The exit value can be replaced with the final value when it is cheap
        // to do so.
        if (ReplaceExitValue == UnusedIndVarInLoop) {
          InductionDescriptor ID;
          PHINode *IndPhi = dyn_cast<PHINode>(Inst);
          if (IndPhi) {
            if (!checkIsIndPhi(IndPhi, L, SE, ID))
              continue;
            // This is an induction PHI. Check that the only users are PHI
            // nodes, and induction variable update binary operators.
            if (llvm::any_of(Inst->users(), [&](User *U) {
                  if (!isa<PHINode>(U) && !isa<BinaryOperator>(U))
                    return true;
                  BinaryOperator *B = dyn_cast<BinaryOperator>(U);
                  if (B && B != ID.getInductionBinOp())
                    return true;
                  return false;
                }))
              continue;
          } else {
            // If it is not an induction phi, it must be an induction update
            // binary operator with an induction phi user.
            BinaryOperator *B = dyn_cast<BinaryOperator>(Inst);
            if (!B)
              continue;
            // Every user other than the exit PHI itself must be an induction
            // PHI of L; checkIsIndPhi rejects null (non-PHI) users and fills
            // in ID for the comparison below.
            if (llvm::any_of(Inst->users(), [&](User *U) {
                  PHINode *Phi = dyn_cast<PHINode>(U);
                  if (Phi != PN && !checkIsIndPhi(Phi, L, SE, ID))
                    return true;
                  return false;
                }))
              continue;
            if (B != ID.getInductionBinOp())
              continue;
          }
        }

        // Okay, this instruction has a user outside of the current loop
        // and varies predictably *inside* the loop.  Evaluate the value it
        // contains when the loop exits, if possible.  We prefer to start with
        // expressions which are true for all exits (so as to maximize
        // expression reuse by the SCEVExpander), but resort to per-exit
        // evaluation if that fails.
        const SCEV *ExitValue = SE->getSCEVAtScope(Inst, L->getParentLoop());
        if (isa<SCEVCouldNotCompute>(ExitValue) ||
            !SE->isLoopInvariant(ExitValue, L) ||
            !Rewriter.isSafeToExpand(ExitValue)) {
          // TODO: This should probably be sunk into SCEV in some way; maybe a
          // getSCEVForExit(SCEV*, L, ExitingBB)?  It can be generalized for
          // most SCEV expressions and other recurrence types (e.g. shift
          // recurrences).  Is there existing code we can reuse?
          const SCEV *ExitCount = SE->getExitCount(L, PN->getIncomingBlock(i));
          if (isa<SCEVCouldNotCompute>(ExitCount))
            continue;
          if (auto *AddRec = dyn_cast<SCEVAddRecExpr>(SE->getSCEV(Inst)))
            if (AddRec->getLoop() == L)
              ExitValue = AddRec->evaluateAtIteration(ExitCount, *SE);
          // Re-validate: ExitValue is either the per-exit evaluation or still
          // the value that already failed the checks above.
          if (isa<SCEVCouldNotCompute>(ExitValue) ||
              !SE->isLoopInvariant(ExitValue, L) ||
              !Rewriter.isSafeToExpand(ExitValue))
            continue;
        }

        // Computing the value outside of the loop brings no benefit if it is
        // definitely used inside the loop in a way which can not be optimized
        // away. Avoid doing so unless we know we have a value which computes
        // the ExitValue already. TODO: This should be merged into SCEV
        // expander to leverage its knowledge of existing expressions.
        if (ReplaceExitValue != AlwaysRepl && !isa<SCEVConstant>(ExitValue) &&
            !isa<SCEVUnknown>(ExitValue) && hasHardUserWithinLoop(L, Inst))
          continue;

        // Check if expansions of this SCEV would count as being high cost.
        bool HighCost = Rewriter.isHighCostExpansion(
            ExitValue, L, SCEVCheapExpansionBudget, TTI, Inst);

        // Note that we must not perform expansions until after
        // we query *all* the costs, because if we perform temporary expansion
        // in between, one that we might not intend to keep, said expansion
        // *may* affect cost calculation of the next SCEVs we'll query,
        // and the next SCEV may erroneously get a smaller cost.

        // Collect all the candidate PHINodes to be rewritten.
        Instruction *InsertPt =
          (isa<PHINode>(Inst) || isa<LandingPadInst>(Inst)) ?
          &*Inst->getParent()->getFirstInsertionPt() : Inst;
        RewritePhiSet.emplace_back(PN, i, ExitValue, InsertPt, HighCost);
      }
    }
  }

  // TODO: evaluate whether it is beneficial to change how we calculate
  // high-cost: if we have SCEV 'A' which we know we will expand, should we
  // calculate the cost of other SCEV's after expanding SCEV 'A', thus
  // potentially giving cost bonus to those other SCEV's?

  bool LoopCanBeDel = canLoopBeDeleted(L, RewritePhiSet);
  int NumReplaced = 0;

  // Transformation.
  for (const RewritePhi &Phi : RewritePhiSet) {
    PHINode *PN = Phi.PN;

    // Only do the rewrite when the ExitValue can be expanded cheaply.
    // If LoopCanBeDel is true, rewrite exit value aggressively.
    if ((ReplaceExitValue == OnlyCheapRepl ||
         ReplaceExitValue == UnusedIndVarInLoop) &&
        !LoopCanBeDel && Phi.HighCost)
      continue;

    Value *ExitVal = Rewriter.expandCodeFor(
        Phi.ExpansionSCEV, Phi.PN->getType(), Phi.ExpansionPoint);

    LLVM_DEBUG(dbgs() << "rewriteLoopExitValues: AfterLoopVal = " << *ExitVal
                      << '\n'
                      << "  LoopVal = " << *(Phi.ExpansionPoint) << "\n");

#ifndef NDEBUG
    // If we reuse an instruction from a loop which is neither L nor one of
    // its containing loops, we end up breaking LCSSA form for this loop by
    // creating a new use of its instruction.
    if (auto *ExitInsn = dyn_cast<Instruction>(ExitVal))
      if (auto *EVL = LI->getLoopFor(ExitInsn->getParent()))
        if (EVL != L)
          assert(EVL->contains(L) && "LCSSA breach detected!");
#endif

    NumReplaced++;
    // Remember the old operand before overwriting it so that it can be
    // checked for deadness below.
    Instruction *Inst = cast<Instruction>(PN->getIncomingValue(Phi.Ith));
    PN->setIncomingValue(Phi.Ith, ExitVal);
    // It's necessary to tell ScalarEvolution about this explicitly so that
    // it can walk the def-use list and forget all SCEVs, as it may not be
    // watching the PHI itself. Once the new exit value is in place, there
    // may not be a def-use connection between the loop and every instruction
    // which got a SCEVAddRecExpr for that loop.
    SE->forgetValue(PN);

    // If this instruction is dead now, delete it. Don't do it now to avoid
    // invalidating iterators.
    if (isInstructionTriviallyDead(Inst, TLI))
      DeadInsts.push_back(Inst);

    // Replace PN with ExitVal if that is legal and does not break LCSSA.
    if (PN->getNumIncomingValues() == 1 &&
        LI->replacementPreservesLCSSAForm(PN, ExitVal)) {
      PN->replaceAllUsesWith(ExitVal);
      PN->eraseFromParent();
    }
  }

  // The insertion point instruction may have been deleted; clear it out
  // so that the rewriter doesn't trip over it later.
  Rewriter.clearInsertPoint();
  return NumReplaced;
}


/// Derive estimated trip counts for \p UnrolledLoop and \p RemainderLoop from
/// the estimate attached to \p OrigLoop.
///
/// With an original estimate T and unroll factor \p UF, the unrolled loop is
/// given T / UF iterations and the remainder loop T % UF iterations; both
/// reuse the invocation weight reported for \p OrigLoop. Nothing is changed
/// when \p OrigLoop has no trip count estimate.
void llvm::setProfileInfoAfterUnrolling(Loop *OrigLoop, Loop *UnrolledLoop,
                                        Loop *RemainderLoop, uint64_t UF) {
  assert(UF > 0 && "Zero unrolled factor is not supported");
  assert(UnrolledLoop != RemainderLoop &&
         "Unrolled and Remainder loops are expected to distinct");

  // Query the estimate for the original scalar loop; the invocation weight is
  // returned through the out-parameter.
  unsigned InvocationWeight = 0;
  std::optional<unsigned> OrigTripCount =
      getLoopEstimatedTripCount(OrigLoop, &InvocationWeight);
  if (!OrigTripCount.has_value())
    return;

  // Split the original iteration count between the two loops.
  const unsigned UnrolledTripCount = *OrigTripCount / UF;
  const unsigned RemainderTripCount = *OrigTripCount % UF;

  setLoopEstimatedTripCount(UnrolledLoop, UnrolledTripCount, InvocationWeight);
  setLoopEstimatedTripCount(RemainderLoop, RemainderTripCount,
                            InvocationWeight);
}


/// Utility that implements appending of loops onto a worklist.

/// Loops are added in preorder (analogous for reverse postorder for trees),

/// and the worklist is processed LIFO.

template <typename RangeT>


void llvm::appendReversedLoopsToWorklist(

    RangeT &&Loops, SmallPriorityWorklist<Loop *, 4> &Worklist) {

  // We use an internal worklist to build up the preorder traversal without

  // recursion.

  SmallVector<Loop *, 4> PreOrderLoops, PreOrderWorklist;


  // We walk the initial sequence of loops in reverse because we generally want

  // to visit defs before uses and the worklist is LIFO.

  for (Loop *RootL : Loops) {

    assert(PreOrderLoops.empty() && "Must start with an empty preorder walk.");

    assert(PreOrderWorklist.empty() &&

           "Must start with an empty preorder walk worklist.");

    PreOrderWorklist.push_back(RootL);

    do {

      Loop *L = PreOrderWorklist.pop_back_val();

      PreOrderWorklist.append(L->begin(), L->end());

      PreOrderLoops.push_back(L);

    } while (!PreOrderWorklist.empty());


    Worklist.insert(std::move(PreOrderLoops));

    PreOrderLoops.clear();

  }

}


/// Append the loops in \p Loops to \p Worklist.
///
/// This is a thin forwarder: the range is reversed and handed to
/// appendReversedLoopsToWorklist, which expects its input in reversed order.
template <typename RangeT>
void llvm::appendLoopsToWorklist(RangeT &&Loops,
                                 SmallPriorityWorklist<Loop *, 4> &Worklist) {
  appendReversedLoopsToWorklist(reverse(Loops), Worklist);
}


// Explicit instantiation of appendLoopsToWorklist for an lvalue
// ArrayRef<Loop *> range.
template LLVM_EXPORT_TEMPLATE void
llvm::appendLoopsToWorklist<ArrayRef<Loop *> &>(
    ArrayRef<Loop *> &Loops, SmallPriorityWorklist<Loop *, 4> &Worklist);

// Explicit instantiation of appendLoopsToWorklist for a single Loop, whose
// range elements are its sub-loops.
template LLVM_EXPORT_TEMPLATE void
llvm::appendLoopsToWorklist<Loop &>(Loop &L,
                                    SmallPriorityWorklist<Loop *, 4> &Worklist);


/// Append all loops known to \p LI to \p Worklist.
///
/// Unlike the range-based overload, \p LI is passed to
/// appendReversedLoopsToWorklist without being reversed first.
// NOTE(review): presumably LoopInfo already iterates its top-level loops in
// reversed order, which would make the extra reverse() unnecessary - confirm
// against LoopInfo's documentation.
void llvm::appendLoopsToWorklist(LoopInfo &LI,
                                 SmallPriorityWorklist<Loop *, 4> &Worklist) {
  appendReversedLoopsToWorklist(LI, Worklist);
}


/// Create a new Loop object mirroring \p L and, recursively, all of its
/// sub-loops.
///
/// The new loop is registered as a child of \p PL, or as a top-level loop in
/// \p LI when \p PL is null, and is added to \p LPM when one is given. Only
/// the loop structure is created here: the blocks placed in the new loop are
/// looked up in \p VM, which must already map every block of \p L to a
/// BasicBlock.
///
/// \returns the newly allocated loop.
Loop *llvm::cloneLoop(Loop *L, Loop *PL, ValueToValueMapTy &VM,
                      LoopInfo *LI, LPPassManager *LPM) {
  Loop *Clone = LI->AllocateLoop();

  // Hook the clone into the loop forest at the requested position.
  if (PL)
    PL->addChildLoop(Clone);
  else
    LI->addTopLevelLoop(Clone);

  if (LPM)
    LPM->addLoop(*Clone);

  // Add the mapped counterpart of every block whose innermost loop is L;
  // blocks belonging to sub-loops are added by the recursive calls below.
  for (BasicBlock *BB : L->blocks()) {
    if (LI->getLoopFor(BB) != L)
      continue;
    Clone->addBasicBlockToLoop(cast<BasicBlock>(VM[BB]), *LI);
  }

  // Mirror the sub-loops underneath the clone.
  for (Loop *SubLoop : *L)
    cloneLoop(SubLoop, Clone, VM, LI, LPM);

  return Clone;
}


/// IR Values for the lower and upper bounds of a pointer evolution.  We
/// need to use value-handles because SCEV expansion can invalidate previously
/// expanded values.  Thus expansion of a pointer can invalidate the bounds for
/// a previous one.
struct PointerBounds {
  // Expanded lower bound of the accessed range.
  TrackingVH<Value> Start;
  // Expanded upper bound of the accessed range.
  TrackingVH<Value> End;
  // Stride value that must be checked for negativity at runtime, or null when
  // no such check is required.
  Value *StrideToCheck;
};


/// Materialize the lower and upper bound of the pointer group \p CG as IR
/// values inserted at \p Loc.
///
/// When \p HoistRuntimeChecks is set and \p TheLoop is nested in another loop,
/// the range may be widened to cover all iterations of the outer loop so the
/// resulting checks can be hoisted out of it. In that case a stride value is
/// returned as well whenever the stride is not known to be non-negative.
///
/// \return the expanded bounds (and the optional stride to check).
static PointerBounds expandBounds(const RuntimeCheckingPtrGroup *CG,
                                  Loop *TheLoop, Instruction *Loc,
                                  SCEVExpander &Exp, bool HoistRuntimeChecks) {
  LLVMContext &Ctx = Loc->getContext();
  Type *PtrArithTy = PointerType::get(Ctx, CG->AddressSpace);

  LLVM_DEBUG(dbgs() << "LAA: Adding RT check for range:\n");
  const SCEV *Low = CG->Low;
  const SCEV *High = CG->High;
  const SCEV *Stride = nullptr;

  // If Low and High are themselves loop-variant, the range can be expanded to
  // also include what the outer loop covers. The benefit is that checks built
  // from the expanded range can be hoisted out of the outer loop, which lowers
  // the cost of entering the inner loop and matters for low trip counts. The
  // drawback is that the vectorized inner loop might now never be entered,
  // whereas a restricted range check could have let us in at least once. For
  // that reason the behaviour is not the default and is controlled by the
  // parameter 'HoistRuntimeChecks'.
  auto WidenRangeToOuterLoop = [&]() {
    if (!HoistRuntimeChecks)
      return;
    const Loop *OuterLoop = TheLoop->getParentLoop();
    if (!OuterLoop)
      return;
    auto *HighAR = dyn_cast<SCEVAddRecExpr>(High);
    if (!HighAR)
      return;
    auto *LowAR = dyn_cast<SCEVAddRecExpr>(Low);
    if (!LowAR)
      return;

    // Both bounds must advance by the same step in the outer loop.
    ScalarEvolution &SE = *Exp.getSE();
    const SCEV *Recur = LowAR->getStepRecurrence(SE);
    if (Recur != HighAR->getStepRecurrence(SE) ||
        HighAR->getLoop() != OuterLoop || LowAR->getLoop() != OuterLoop)
      return;

    // The outer loop needs a computable, integer-typed exit count.
    BasicBlock *OuterLoopLatch = OuterLoop->getLoopLatch();
    const SCEV *OuterExitCount = SE.getExitCount(OuterLoop, OuterLoopLatch);
    if (isa<SCEVCouldNotCompute>(OuterExitCount) ||
        !OuterExitCount->getType()->isIntegerTy())
      return;

    const SCEV *NewHigh = HighAR->evaluateAtIteration(OuterExitCount, SE);
    if (isa<SCEVCouldNotCompute>(NewHigh))
      return;

    LLVM_DEBUG(dbgs() << "LAA: Expanded RT check for range to include "
                         "outer loop in order to permit hoisting\n");
    High = NewHigh;
    Low = LowAR->getStart();

    // A possibly negative stride requires an extra runtime check that the
    // stride is positive.
    if (SE.isKnownNonNegative(SE.applyLoopGuards(Recur, HighAR->getLoop())))
      return;
    Stride = Recur;
    LLVM_DEBUG(dbgs() << "LAA: ... but need to check stride is "
                         "positive: "
                      << *Stride << '\n');
  };
  WidenRangeToOuterLoop();

  Value *Start = Exp.expandCodeFor(Low, PtrArithTy, Loc);
  Value *End = Exp.expandCodeFor(High, PtrArithTy, Loc);
  if (CG->NeedsFreeze) {
    IRBuilder<> Builder(Loc);
    Start = Builder.CreateFreeze(Start, Start->getName() + ".fr");
    End = Builder.CreateFreeze(End, End->getName() + ".fr");
  }

  Value *StrideVal = nullptr;
  if (Stride)
    StrideVal = Exp.expandCodeFor(Stride, Stride->getType(), Loc);

  LLVM_DEBUG(dbgs() << "Start: " << *Low << " End: " << *High << "\n");
  return {Start, End, StrideVal};
}


/// Expand every runtime pointer check in \p PointerChecks into a pair of
/// PointerBounds, one for each of the two pointer groups of the check.
static SmallVector<std::pair<PointerBounds, PointerBounds>, 4>
expandBounds(const SmallVectorImpl<RuntimePointerCheck> &PointerChecks, Loop *L,
             Instruction *Loc, SCEVExpander &Exp, bool HoistRuntimeChecks) {
  SmallVector<std::pair<PointerBounds, PointerBounds>, 4> Expanded;

  // The same group may show up in several checks; the SCEV Expander's cache
  // is relied upon to emit the code for identical bounds only once.
  for (const RuntimePointerCheck &Check : PointerChecks) {
    PointerBounds FirstBounds =
        expandBounds(Check.first, L, Loc, Exp, HoistRuntimeChecks);
    PointerBounds SecondBounds =
        expandBounds(Check.second, L, Loc, Exp, HoistRuntimeChecks);
    Expanded.push_back(std::make_pair(FirstBounds, SecondBounds));
  }

  return Expanded;
}


/// Emit, before \p Loc, the runtime overlap checks described by
/// \p PointerChecks and OR them together.
///
/// \returns the combined "some pair conflicts" value, or null when
/// \p PointerChecks is empty. The value may have been folded to a constant.
Value *llvm::addRuntimeChecks(
    Instruction *Loc, Loop *TheLoop,
    const SmallVectorImpl<RuntimePointerCheck> &PointerChecks,
    SCEVExpander &Exp, bool HoistRuntimeChecks) {
  // TODO: Move noalias annotation code from LoopVersioning here and share with LV if possible.
  // TODO: Pass  RtPtrChecking instead of PointerChecks and SE separately, if possible
  auto ExpandedChecks =
      expandBounds(PointerChecks, TheLoop, Loc, Exp, HoistRuntimeChecks);

  LLVMContext &Ctx = Loc->getContext();
  IRBuilder ChkBuilder(Ctx, InstSimplifyFolder(Loc->getDataLayout()));
  ChkBuilder.SetInsertPoint(Loc);

  // ORs "Stride < 0" into Conflict when a stride check was requested for the
  // group; otherwise Conflict is passed through untouched.
  auto OrInNegativeStride = [&ChkBuilder](Value *Conflict,
                                          Value *Stride) -> Value * {
    if (!Stride)
      return Conflict;
    Value *IsNegativeStride = ChkBuilder.CreateICmpSLT(
        Stride, ConstantInt::get(Stride->getType(), 0), "stride.check");
    return ChkBuilder.CreateOr(Conflict, IsNegativeStride);
  };

  // Running OR over all pairs; stays null until the first pair is handled.
  Value *MemoryRuntimeCheck = nullptr;

  for (const auto &BoundsPair : ExpandedChecks) {
    const PointerBounds &A = BoundsPair.first;
    const PointerBounds &B = BoundsPair.second;

    assert((A.Start->getType()->getPointerAddressSpace() ==
            B.End->getType()->getPointerAddressSpace()) &&
           (B.Start->getType()->getPointerAddressSpace() ==
            A.End->getType()->getPointerAddressSpace()) &&
           "Trying to bounds check pointers with different address spaces");

    // Start is the first accessed byte of a group and End is one past the
    // last accessed byte, so the two ranges are disjoint exactly when
    //   (A.Start >= B.End) || (B.Start >= A.End)
    // and they conflict when both of the following hold:
    //   bound0 = (A.Start < B.End)
    //   bound1 = (B.Start < A.End)
    Value *Cmp0 = ChkBuilder.CreateICmpULT(A.Start, B.End, "bound0");
    Value *Cmp1 = ChkBuilder.CreateICmpULT(B.Start, A.End, "bound1");
    Value *IsConflict = ChkBuilder.CreateAnd(Cmp0, Cmp1, "found.conflict");

    // A negative stride on either side is treated like a conflict.
    IsConflict = OrInNegativeStride(IsConflict, A.StrideToCheck);
    IsConflict = OrInNegativeStride(IsConflict, B.StrideToCheck);

    MemoryRuntimeCheck =
        MemoryRuntimeCheck
            ? ChkBuilder.CreateOr(MemoryRuntimeCheck, IsConflict,
                                  "conflict.rdx")
            : IsConflict;
  }

  Exp.eraseDeadInstructions(MemoryRuntimeCheck);
  return MemoryRuntimeCheck;
}


/// Emit, before \p Loc, difference-based runtime checks for \p Checks and OR
/// them together.
///
/// For each entry the check is (SinkStart - SrcStart) <u VF * IC * AccessSize,
/// where VF is obtained from \p GetVF. A compare on operands that were already
/// compared for an earlier entry is not emitted again.
///
/// \returns the combined conflict value, or null when no check was emitted.
/// The value may have been folded to a constant.
Value *llvm::addDiffRuntimeChecks(
    Instruction *Loc, ArrayRef<PointerDiffInfo> Checks, SCEVExpander &Expander,
    function_ref<Value *(IRBuilderBase &, unsigned)> GetVF, unsigned IC) {
  LLVMContext &Ctx = Loc->getContext();
  IRBuilder ChkBuilder(Ctx, InstSimplifyFolder(Loc->getDataLayout()));
  ChkBuilder.SetInsertPoint(Loc);

  ScalarEvolution &SE = *Expander.getSE();

  // Compares created so far, keyed by their operand pair, so that redundant
  // compares can be detected and skipped.
  DenseMap<std::pair<Value *, Value *>, Value *> SeenCompares;

  // Running OR over all emitted checks; stays null until the first one.
  Value *MemoryRuntimeCheck = nullptr;

  for (const auto &[Src, Sink, Size, Freeze] : Checks) {
    Type *Ty = Sink->getType();

    // Threshold: VF * IC * AccessSize.
    Value *VF = GetVF(ChkBuilder, Ty->getScalarSizeInBits());
    Value *Threshold =
        ChkBuilder.CreateMul(VF, ConstantInt::get(Ty, IC * Size));

    // Distance between the sink and the source start.
    Value *Diff = Expander.expandCodeFor(SE.getMinusSCEV(Sink, Src), Ty, Loc);

    // An identical compare has been emitted before; nothing new to check.
    const std::pair<Value *, Value *> Key(Diff, Threshold);
    if (SeenCompares.count(Key))
      continue;

    Value *IsConflict = ChkBuilder.CreateICmpULT(Diff, Threshold, "diff.check");
    SeenCompares.insert({Key, IsConflict});

    if (Freeze)
      IsConflict =
          ChkBuilder.CreateFreeze(IsConflict, IsConflict->getName() + ".fr");

    MemoryRuntimeCheck =
        MemoryRuntimeCheck
            ? ChkBuilder.CreateOr(MemoryRuntimeCheck, IsConflict,
                                  "conflict.rdx")
            : IsConflict;
  }

  Expander.eraseDeadInstructions(MemoryRuntimeCheck);
  return MemoryRuntimeCheck;
}


/// Check whether the conditional branch terminating the header of \p L is a
/// candidate for partial unswitching.
///
/// The branch condition must be a CmpInst or TruncInst inside the loop whose
/// in-loop operands are, transitively, only non-volatile, non-atomic loads and
/// GEPs. For each successor of the branch (successor 0 first) the blocks of
/// the loop reachable from that successor are collected, and the MemorySSA
/// accesses reachable from the loads' defining accesses are checked for
/// writes that may modify the loaded locations. At most \p MSSAThreshold
/// accesses are inspected per successor.
///
/// \returns an IVConditionInfo for the first successor that passes the checks,
/// with KnownValue set to true for successor 0 and false for successor 1, or
/// an empty optional when neither successor qualifies.
std::optional<IVConditionInfo>
llvm::hasPartialIVCondition(const Loop &L, unsigned MSSAThreshold,
                            const MemorySSA &MSSA, AAResults &AA) {
  auto *TI = dyn_cast<BranchInst>(L.getHeader()->getTerminator());
  if (!TI || !TI->isConditional())
    return {};

  auto *CondI = dyn_cast<Instruction>(TI->getCondition());
  // The case with the condition outside the loop should already be handled
  // earlier.
  // Allow CmpInst and TruncInsts as they may be users of load instructions
  // and have potential for partial unswitching
  if (!CondI || !isa<CmpInst, TruncInst>(CondI) || !L.contains(CondI))
    return {};

  // Instructions that compute the condition, starting with the condition
  // itself.
  SmallVector<Instruction *> InstToDuplicate;
  InstToDuplicate.push_back(CondI);

  // Walk the operands of the condition transitively.
  SmallVector<Value *, 4> WorkList;
  WorkList.append(CondI->op_begin(), CondI->op_end());

  SmallVector<MemoryAccess *, 4> AccessesToCheck;
  SmallVector<MemoryLocation, 4> AccessedLocs;
  while (!WorkList.empty()) {
    Instruction *I = dyn_cast<Instruction>(WorkList.pop_back_val());
    // Non-instructions and values defined outside the loop need no handling.
    if (!I || !L.contains(I))
      continue;

    // TODO: support additional instructions.
    if (!isa<LoadInst>(I) && !isa<GetElementPtrInst>(I))
      return {};

    // Do not duplicate volatile and atomic loads.
    if (auto *LI = dyn_cast<LoadInst>(I))
      if (LI->isVolatile() || LI->isAtomic())
        return {};

    InstToDuplicate.push_back(I);
    if (MemoryAccess *MA = MSSA.getMemoryAccess(I)) {
      if (auto *MemUse = dyn_cast_or_null<MemoryUse>(MA)) {
        // Queue the defining access to check for alias checks.
        AccessesToCheck.push_back(MemUse->getDefiningAccess());
        AccessedLocs.push_back(MemoryLocation::get(I));
      } else {
        // MemoryDefs may clobber the location or may be atomic memory
        // operations. Bail out.
        return {};
      }
    }
    WorkList.append(I->op_begin(), I->op_end());
  }

  if (InstToDuplicate.empty())
    return {};

  SmallVector<BasicBlock *, 4> ExitingBlocks;
  L.getExitingBlocks(ExitingBlocks);
  // Analyze the part of the loop reachable through one successor of the
  // header branch. AccessesToCheck is taken by value because the lambda
  // consumes it and is invoked once per successor.
  auto HasNoClobbersOnPath =
      [&L, &AA, &AccessedLocs, &ExitingBlocks, &InstToDuplicate,
       MSSAThreshold](BasicBlock *Succ, BasicBlock *Header,
                      SmallVector<MemoryAccess *, 4> AccessesToCheck)
      -> std::optional<IVConditionInfo> {
    IVConditionInfo Info;
    // First, collect all blocks in the loop that are on a path from Succ
    // to the header.
    SmallVector<BasicBlock *, 4> WorkList;
    WorkList.push_back(Succ);
    WorkList.push_back(Header);
    // The header is marked as seen up front, so the walk does not expand its
    // successors; its instructions are inspected here instead.
    SmallPtrSet<BasicBlock *, 4> Seen;
    Seen.insert(Header);
    Info.PathIsNoop &=
        all_of(*Header, [](Instruction &I) { return !I.mayHaveSideEffects(); });

    while (!WorkList.empty()) {
      BasicBlock *Current = WorkList.pop_back_val();
      if (!L.contains(Current))
        continue;
      const auto &SeenIns = Seen.insert(Current);
      if (!SeenIns.second)
        continue;

      Info.PathIsNoop &= all_of(
          *Current, [](Instruction &I) { return !I.mayHaveSideEffects(); });
      WorkList.append(succ_begin(Current), succ_end(Current));
    }

    // Require at least 2 blocks on a path through the loop. This skips
    // paths that directly exit the loop.
    if (Seen.size() < 2)
      return {};

    // Next, check if there are any MemoryDefs that are on the path through
    // the loop (in the Seen set) and they may-alias any of the locations in
    // AccessedLocs. If that is the case, they may modify the condition and
    // partial unswitching is not possible.
    SmallPtrSet<MemoryAccess *, 4> SeenAccesses;
    while (!AccessesToCheck.empty()) {
      MemoryAccess *Current = AccessesToCheck.pop_back_val();
      auto SeenI = SeenAccesses.insert(Current);
      if (!SeenI.second || !Seen.contains(Current->getBlock()))
        continue;

      // Bail out if exceeded the threshold.
      if (SeenAccesses.size() >= MSSAThreshold)
        return {};

      // MemoryUse are read-only accesses.
      if (isa<MemoryUse>(Current))
        continue;

      // For a MemoryDef, check if it aliases any of the locations feeding
      // the original condition.
      if (auto *CurrentDef = dyn_cast<MemoryDef>(Current)) {
        if (any_of(AccessedLocs, [&AA, CurrentDef](MemoryLocation &Loc) {
              return isModSet(
                  AA.getModRefInfo(CurrentDef->getMemoryInst(), Loc));
            }))
          return {};
      }

      // Continue with the accesses that use the current one.
      for (Use &U : Current->uses())
        AccessesToCheck.push_back(cast<MemoryAccess>(U.getUser()));
    }

    // We could also allow loops with known trip counts without mustprogress,
    // but ScalarEvolution may not be available.
    Info.PathIsNoop &= isMustProgress(&L);

    // If the path is considered a no-op so far, check if it reaches a
    // single exit block without any phis. This ensures no values from the
    // loop are used outside of the loop.
    if (Info.PathIsNoop) {
      for (auto *Exiting : ExitingBlocks) {
        if (!Seen.contains(Exiting))
          continue;
        for (auto *Succ : successors(Exiting)) {
          if (L.contains(Succ))
            continue;

          Info.PathIsNoop &= Succ->phis().empty() &&
                             (!Info.ExitForPath || Info.ExitForPath == Succ);
          if (!Info.PathIsNoop)
            break;
          assert((!Info.ExitForPath || Info.ExitForPath == Succ) &&
                 "cannot have multiple exit blocks");
          Info.ExitForPath = Succ;
        }
      }
    }
    // Without an exit block for the path it cannot be treated as a no-op.
    if (!Info.ExitForPath)
      Info.PathIsNoop = false;

    Info.InstToDuplicate = InstToDuplicate;
    return Info;
  };

  // If we branch to the same successor, partial unswitching will not be
  // beneficial.
  if (TI->getSuccessor(0) == TI->getSuccessor(1))
    return {};

  // Try the successor taken when the condition is true first, then the one
  // taken when it is false.
  if (auto Info = HasNoClobbersOnPath(TI->getSuccessor(0), L.getHeader(),
                                      AccessesToCheck)) {
    Info->KnownValue = ConstantInt::getTrue(TI->getContext());
    return Info;
  }
  if (auto Info = HasNoClobbersOnPath(TI->getSuccessor(1), L.getHeader(),
                                      AccessesToCheck)) {
    Info->KnownValue = ConstantInt::getFalse(TI->getContext());
    return Info;
  }

  return {};
}


Poison
@ Poison
Definition AArch64AsmPrinter.cpp:74

assert
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")

Select
AMDGPU Register Bank Select
Definition AMDGPURegBankSelect.cpp:68

AliasAnalysis.h

BasicAliasAnalysis.h
This is the interface for LLVM's primary stateless and local alias analysis.

blocks
bbsections Prepares for basic block by splitting functions into clusters of basic blocks
Definition BasicBlockSections.cpp:141

BasicBlockUtils.h

A
static GCRegistry::Add< ErlangGC > A("erlang", "erlang-compatible garbage collector")

D
static GCRegistry::Add< StatepointGC > D("statepoint-example", "an example strategy for statepoint")

B
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")

Compiler.h

LLVM_EXPORT_TEMPLATE
#define LLVM_EXPORT_TEMPLATE
Definition Compiler.h:215

DIBuilder.h

DenseSet.h
This file defines the DenseSet and SmallDenseSet classes.

DomTreeUpdater.h

Dominators.h

Check
#define Check(C,...)
Definition GenericConvergenceVerifierImpl.h:34

GlobalsModRef.h
This is the interface for a simple mod/ref and alias analysis over globals.

Cleanup
static const HTTPClientCleanup Cleanup
Definition HTTPClient.cpp:42

Loops
Hexagon Hardware Loops
Definition HexagonHardwareLoops.cpp:367

IntrinsicInst.h

Module.h
Module.h This file contains the declarations for the Module class.

Users
iv Induction Variable Users
Definition IVUsers.cpp:48

ReplaceExitValue
static cl::opt< ReplaceExitVal > ReplaceExitValue("replexitval", cl::Hidden, cl::init(OnlyCheapRepl), cl::desc("Choose the strategy to replace exit value in IndVarSimplify"), cl::values(clEnumValN(NeverRepl, "never", "never replace exit value"), clEnumValN(OnlyCheapRepl, "cheap", "only replace exit value when the cost is cheap"), clEnumValN(UnusedIndVarInLoop, "unusedindvarinloop", "only replace exit value when it is an unused " "induction variable in the loop and has cheap replacement cost"), clEnumValN(NoHardUse, "noharduse", "only replace exit values when loop def likely dead"), clEnumValN(AlwaysRepl, "always", "always replace exit value whenever possible")))

InitializePasses.h

InstSimplifyFolder.h

Instructions.h

Ops
const AbstractManglingParser< Derived, Alloc >::OperatorInfo AbstractManglingParser< Derived, Alloc >::Ops[]
Definition ItaniumDemangle.h:3368

HoistRuntimeChecks
static cl::opt< bool, true > HoistRuntimeChecks("hoist-runtime-checks", cl::Hidden, cl::desc("Hoist inner loop runtime memory checks to outer loop if possible"), cl::location(VectorizerParams::HoistRuntimeChecks), cl::init(true))

LoopAccessAnalysis.h

LoopInfo.h

LoopPass.h

hasHardUserWithinLoop
static bool hasHardUserWithinLoop(const Loop *L, const Instruction *I)
Definition LoopUtils.cpp:1552

LLVMLoopDisableLICM
static const char * LLVMLoopDisableLICM
Definition LoopUtils.cpp:56

expandBounds
static PointerBounds expandBounds(const RuntimeCheckingPtrGroup *CG, Loop *TheLoop, Instruction *Loc, SCEVExpander &Exp, bool HoistRuntimeChecks)
Expand code for the lower and upper bound of the pointer group CG in TheLoop.
Definition LoopUtils.cpp:1976

canLoopBeDeleted
static bool canLoopBeDeleted(Loop *L, SmallVector< RewritePhi, 8 > &RewritePhiSet)
Definition LoopUtils.cpp:1593

LLVMLoopDisableNonforced
static const char * LLVMLoopDisableNonforced
Definition LoopUtils.cpp:55

createStringMetadata
static MDNode * createStringMetadata(Loop *TheLoop, StringRef Name, unsigned V)
Create MDNode for input string.
Definition LoopUtils.cpp:204

getExpectedExitLoopLatchBranch
static BranchInst * getExpectedExitLoopLatchBranch(Loop *L)
Checks if L has an exiting latch branch.
Definition LoopUtils.cpp:791

estimateLoopTripCount
static std::optional< unsigned > estimateLoopTripCount(Loop *L)
Definition LoopUtils.cpp:820

checkIsIndPhi
static bool checkIsIndPhi(PHINode *Phi, Loop *L, ScalarEvolution *SE, InductionDescriptor &ID)
Checks if it is safe to call InductionDescriptor::isInductionPHI for Phi, and returns true if this Ph...
Definition LoopUtils.cpp:1647

LoopUtils.h

I
#define I(x, y, z)
Definition MD5.cpp:58

H
#define H(x, y, z)
Definition MD5.cpp:57

MDBuilder.h

MemorySSAUpdater.h

MemorySSA.h
This file exposes an interface to building/using memory SSA to walk memory instructions using a use/d...

High
uint64_t High
Definition NVVMIntrRange.cpp:46

P
#define P(N)

INITIALIZE_PASS_DEPENDENCY
#define INITIALIZE_PASS_DEPENDENCY(depName)
Definition PassSupport.h:42

Pass.h

PatternMatch.h

PriorityWorklist.h
This file provides a priority worklist.

ProfDataUtils.h
This file contains the declarations for profiling metadata utility functions.

Cond
const SmallVectorImpl< MachineOperand > & Cond
Definition RISCVRedundantCopyElimination.cpp:71

Opc
auto Opc
Definition RISCVRedundantCopyElimination.cpp:75

ScalarEvolutionAliasAnalysis.h
This is the interface for a SCEV-based alias analysis.

ScalarEvolutionExpander.h

ScalarEvolutionExpressions.h

ScalarEvolution.h

ScopeExit.h
This file defines the make_scope_exit function, which executes user-defined cleanup logic at scope ex...

SetVector.h
This file implements a set that has insertion order iteration characteristics.

MSSAThreshold
static cl::opt< unsigned > MSSAThreshold("simple-loop-unswitch-memoryssa-threshold", cl::desc("Max number of memory uses to explore during " "partial unswitching analysis"), cl::init(100), cl::Hidden)

SmallPtrSet.h
This file defines the SmallPtrSet class.

SmallVector.h
This file defines the SmallVector class.

Debug.h

LLVM_DEBUG
#define LLVM_DEBUG(...)
Definition Debug.h:114

Local.h

ValueHandle.h

Node
Definition ItaniumDemangle.h:166

llvm::AAResultsWrapperPass
A wrapper pass to provide the legacy pass manager access to a suitably prepared AAResults object.
Definition AliasAnalysis.h:1008

llvm::AAResults
Definition AliasAnalysis.h:318

llvm::APFloat::getLargest
static APFloat getLargest(const fltSemantics &Sem, bool Negative=false)
Returns the largest finite number in the given semantics.
Definition APFloat.h:1138

llvm::APInt
Class for arbitrary precision integers.
Definition APInt.h:78

llvm::APInt::getMaxValue
static APInt getMaxValue(unsigned numBits)
Gets maximum unsigned value of APInt for specific bit width.
Definition APInt.h:206

llvm::APInt::getSignedMaxValue
static APInt getSignedMaxValue(unsigned numBits)
Gets maximum signed value of APInt for a specific bit width.
Definition APInt.h:209

llvm::APInt::getMinValue
static APInt getMinValue(unsigned numBits)
Gets minimum unsigned value of APInt for a specific bit width.
Definition APInt.h:216

llvm::APInt::getSignedMinValue
static APInt getSignedMinValue(unsigned numBits)
Gets minimum signed value of APInt for a specific bit width.
Definition APInt.h:219

llvm::AnalysisUsage
Represent the analysis usage information of a pass.
Definition PassAnalysisSupport.h:48

llvm::AnalysisUsage::addRequiredID
LLVM_ABI AnalysisUsage & addRequiredID(const void *ID)
Definition Pass.cpp:284

llvm::AnalysisUsage::addPreservedID
AnalysisUsage & addPreservedID(const void *ID)
Definition PassAnalysisSupport.h:89

llvm::AnalysisUsage::addRequired
AnalysisUsage & addRequired()
Definition PassAnalysisSupport.h:76

llvm::AnalysisUsage::addPreserved
AnalysisUsage & addPreserved()
Add the specified Pass class to the set of analyses preserved by this pass.
Definition PassAnalysisSupport.h:99

llvm::ArrayRef
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition ArrayRef.h:41

llvm::BasicAAWrapperPass
Legacy wrapper pass to provide the BasicAAResult object.
Definition BasicAliasAnalysis.h:169

llvm::BasicBlock
LLVM Basic Block Representation.
Definition BasicBlock.h:62

llvm::BasicBlock::begin
iterator begin()
Instruction iterator methods.
Definition BasicBlock.h:459

llvm::BasicBlock::iterator
InstListType::iterator iterator
Instruction iterators...
Definition BasicBlock.h:170

llvm::BasicBlock::getContext
LLVM_ABI LLVMContext & getContext() const
Get the context in which this basic block lives.
Definition BasicBlock.cpp:131

llvm::BasicBlock::getTerminator
const Instruction * getTerminator() const LLVM_READONLY
Returns the terminator instruction if the block is well formed or null if the block is not well forme...
Definition BasicBlock.h:233

llvm::BinaryOperator
Definition InstrTypes.h:171

llvm::BranchInst
Conditional or Unconditional Branch instruction.
Definition Instructions.h:3057

llvm::BranchInst::getNumSuccessors
unsigned getNumSuccessors() const
Definition Instructions.h:3143

llvm::BranchInst::getSuccessor
BasicBlock * getSuccessor(unsigned i) const
Definition Instructions.h:3145

llvm::CmpInst::Predicate
Predicate
This enumeration lists the possible predicates for CmpInst subclasses.
Definition InstrTypes.h:678

llvm::CmpInst::ICMP_SLT
@ ICMP_SLT
signed less than
Definition InstrTypes.h:707

llvm::CmpInst::ICMP_SLE
@ ICMP_SLE
signed less or equal
Definition InstrTypes.h:708

llvm::CmpInst::FCMP_OLT
@ FCMP_OLT
0 1 0 0 True if ordered and less than
Definition InstrTypes.h:684

llvm::CmpInst::FCMP_OGT
@ FCMP_OGT
0 0 1 0 True if ordered and greater than
Definition InstrTypes.h:682

llvm::CmpInst::ICMP_UGT
@ ICMP_UGT
unsigned greater than
Definition InstrTypes.h:701

llvm::CmpInst::ICMP_SGT
@ ICMP_SGT
signed greater than
Definition InstrTypes.h:705

llvm::CmpInst::ICMP_ULT
@ ICMP_ULT
unsigned less than
Definition InstrTypes.h:703

llvm::CmpInst::ICMP_NE
@ ICMP_NE
not equal
Definition InstrTypes.h:700

llvm::CmpInst::ICMP_SGE
@ ICMP_SGE
signed greater or equal
Definition InstrTypes.h:706

llvm::ConstantAsMetadata::get
static ConstantAsMetadata * get(Constant *C)
Definition Metadata.h:535

llvm::ConstantExpr::getIntrinsicIdentity
static LLVM_ABI Constant * getIntrinsicIdentity(Intrinsic::ID, Type *Ty)
Definition Constants.cpp:2739

llvm::ConstantExpr::getBinOpIdentity
static LLVM_ABI Constant * getBinOpIdentity(unsigned Opcode, Type *Ty, bool AllowRHSConstant=false, bool NSZ=false)
Return the identity constant for a binary opcode.
Definition Constants.cpp:2694

llvm::ConstantFP::getInfinity
static LLVM_ABI Constant * getInfinity(Type *Ty, bool Negative=false)
Definition Constants.cpp:1105

llvm::ConstantFP::getQNaN
static LLVM_ABI Constant * getQNaN(Type *Ty, bool Negative=false, APInt *Payload=nullptr)
Definition Constants.cpp:1037

llvm::ConstantInt
This is the shared class of boolean and integer constants.
Definition Constants.h:87

llvm::ConstantInt::getTrue
static LLVM_ABI ConstantInt * getTrue(LLVMContext &Context)
Definition Constants.cpp:868

llvm::ConstantInt::getFalse
static LLVM_ABI ConstantInt * getFalse(LLVMContext &Context)
Definition Constants.cpp:875

llvm::ConstantInt::getSExtValue
int64_t getSExtValue() const
Return the constant as a 64-bit integer value after it has been sign extended as appropriate for the ...
Definition Constants.h:169

llvm::DIBuilder
Definition DIBuilder.h:46

llvm::DbgVariableRecord
Record of a variable value-assignment, aka a non instruction representation of the dbg....
Definition DebugProgramInstruction.h:277

llvm::DebugVariable
Identifies a unique instance of a variable.
Definition DebugInfoMetadata.h:4589

llvm::DenseMapBase::lookup
ValueT lookup(const_arg_type_t< KeyT > Val) const
lookup - Return the entry for the specified key, or a default constructed value if no such entry exis...
Definition DenseMap.h:187

llvm::DenseMapBase::insert
std::pair< iterator, bool > insert(const std::pair< KeyT, ValueT > &KV)
Definition DenseMap.h:214

llvm::DenseMap
Definition DenseMap.h:700

llvm::DomTreeNodeBase::children
iterator_range< iterator > children()
Definition GenericDomTree.h:84

llvm::DomTreeUpdater
Definition DomTreeUpdater.h:34

llvm::DominatorTreeBase< BasicBlock, false >::Delete
static constexpr UpdateKind Delete
Definition GenericDomTree.h:253

llvm::DominatorTreeBase< BasicBlock, false >::Insert
static constexpr UpdateKind Insert
Definition GenericDomTree.h:252

llvm::DominatorTreeBase::getNode
DomTreeNodeBase< NodeT > * getNode(const NodeT *BB) const
getNode - return the (Post)DominatorTree node for the specified basic block.
Definition GenericDomTree.h:401

llvm::DominatorTreeWrapperPass
Legacy analysis pass which computes a DominatorTree.
Definition Dominators.h:322

llvm::DominatorTree
Concrete subclass of DominatorTreeBase that is used to compute a normal dominator tree.
Definition Dominators.h:165

llvm::DominatorTree::isReachableFromEntry
LLVM_ABI bool isReachableFromEntry(const Use &U) const
Provide an overload for a Use.
Definition Dominators.cpp:334

llvm::ElementCount::get
static constexpr ElementCount get(ScalarTy MinVal, bool Scalable)
Definition TypeSize.h:315

llvm::FastMathFlags
Convenience struct for specifying and reasoning about fast-math flags.
Definition FMF.h:22

llvm::FastMathFlags::noSignedZeros
bool noSignedZeros() const
Definition FMF.h:67

llvm::FastMathFlags::noNaNs
bool noNaNs() const
Definition FMF.h:65

llvm::GenericDomTreeUpdater::applyUpdates
void applyUpdates(ArrayRef< UpdateT > Updates)
Submit updates to all available trees.
Definition GenericDomTreeUpdaterImpl.h:59

llvm::GlobalsAAWrapperPass
Legacy wrapper pass to provide the GlobalsAAResult object.
Definition GlobalsModRef.h:146

llvm::IRBuilderBase
Common base class shared among various IRBuilders.
Definition IRBuilder.h:114

llvm::IRBuilderBase::CreateICmpULT
Value * CreateICmpULT(Value *LHS, Value *RHS, const Twine &Name="")
Definition IRBuilder.h:2345

llvm::IRBuilderBase::CreateFreeze
Value * CreateFreeze(Value *V, const Twine &Name="")
Definition IRBuilder.h:2637

llvm::IRBuilderBase::CreateAnd
Value * CreateAnd(Value *LHS, Value *RHS, const Twine &Name="")
Definition IRBuilder.h:1551

llvm::IRBuilderBase::CreateICmpSLT
Value * CreateICmpSLT(Value *LHS, Value *RHS, const Twine &Name="")
Definition IRBuilder.h:2361

llvm::IRBuilderBase::SetInsertPoint
void SetInsertPoint(BasicBlock *TheBB)
This specifies that created instructions should be appended to the end of the specified block.
Definition IRBuilder.h:207

llvm::IRBuilderBase::CreateOr
Value * CreateOr(Value *LHS, Value *RHS, const Twine &Name="", bool IsDisjoint=false)
Definition IRBuilder.h:1573

llvm::IRBuilderBase::CreateMul
Value * CreateMul(Value *LHS, Value *RHS, const Twine &Name="", bool HasNUW=false, bool HasNSW=false)
Definition IRBuilder.h:1437

llvm::IRBuilder
This provides a uniform API for creating instructions and inserting them into a basic block: either a...
Definition IRBuilder.h:2780

llvm::InductionDescriptor
A struct for saving information about induction variables.
Definition IVDescriptors.h:380

llvm::InductionDescriptor::isInductionPHI
static LLVM_ABI bool isInductionPHI(PHINode *Phi, const Loop *L, ScalarEvolution *SE, InductionDescriptor &D, const SCEV *Expr=nullptr, SmallVectorImpl< Instruction * > *CastsToIgnore=nullptr)
Returns true if Phi is an induction in the loop L.
Definition IVDescriptors.cpp:1609

llvm::InstSimplifyFolder
InstSimplifyFolder - Use InstructionSimplify to fold operations to existing values.
Definition InstSimplifyFolder.h:36

llvm::Instruction
Definition Instruction.h:69

llvm::Instruction::getNumSuccessors
LLVM_ABI unsigned getNumSuccessors() const LLVM_READONLY
Return the number of successors that this instruction has.
Definition Instruction.cpp:1281

llvm::Instruction::eraseFromParent
LLVM_ABI InstListType::iterator eraseFromParent()
This method unlinks 'this' from the containing basic block and deletes it.
Definition Instruction.cpp:104

llvm::Instruction::mayHaveSideEffects
LLVM_ABI bool mayHaveSideEffects() const LLVM_READONLY
Return true if the instruction may have side effects.
Definition Instruction.cpp:1213

llvm::Instruction::setMetadata
LLVM_ABI void setMetadata(unsigned KindID, MDNode *Node)
Set the metadata of the specified kind to the specified node.
Definition Metadata.cpp:1718

llvm::Instruction::BinaryOps
BinaryOps
Definition Instruction.h:998

llvm::LLVMContext
This is an important class for using LLVM in a threaded context.
Definition LLVMContext.h:68

llvm::LPPassManager
Definition LoopPass.h:77

llvm::LPPassManager::addLoop
void addLoop(Loop &L)
Definition LoopPass.cpp:77

llvm::LoopBase::contains
bool contains(const LoopT *L) const
Return true if the specified loop is contained within this loop.
Definition GenericLoopInfo.h:124

llvm::LoopBase::getLoopLatch
BlockT * getLoopLatch() const
If there is a single latch block for this loop, return it.
Definition GenericLoopInfoImpl.h:256

llvm::LoopBase::getHeader
BlockT * getHeader() const
Definition GenericLoopInfo.h:90

llvm::LoopBase< BasicBlock, Loop >::iterator
std::vector< Loop * >::const_iterator iterator
Definition GenericLoopInfo.h:153

llvm::LoopBase::getParentLoop
LoopT * getParentLoop() const
Return the parent loop if it exists or nullptr for top level loops.
Definition GenericLoopInfo.h:99

llvm::LoopInfoBase::addTopLevelLoop
void addTopLevelLoop(LoopT *New)
This adds the specified loop to the collection of top-level loops.
Definition GenericLoopInfo.h:663

llvm::LoopInfoBase::end
iterator end() const
Definition GenericLoopInfo.h:582

llvm::LoopInfoBase::removeBlock
void removeBlock(BlockT *BB)
This method completely removes BB from all data structures, including all of the Loop objects it is n...
Definition GenericLoopInfo.h:671

llvm::LoopInfoBase::AllocateLoop
LoopT * AllocateLoop(ArgsTy &&...Args)
Definition GenericLoopInfo.h:570

llvm::LoopInfoBase::removeLoop
LoopT * removeLoop(iterator I)
This removes the specified top-level loop from this loop info object.
Definition GenericLoopInfo.h:633

llvm::LoopInfoBase::getLoopFor
LoopT * getLoopFor(const BlockT *BB) const
Return the inner most loop that BB lives in.
Definition GenericLoopInfo.h:606

llvm::LoopInfoBase::destroy
void destroy(LoopT *L)
Destroy a loop that has been removed from the LoopInfo nest.
Definition GenericLoopInfo.h:710

llvm::LoopInfoWrapperPass
The legacy pass manager's analysis pass to compute loop information.
Definition LoopInfo.h:596

llvm::LoopInfo
Definition LoopInfo.h:408

llvm::LoopInfo::replacementPreservesLCSSAForm
bool replacementPreservesLCSSAForm(Instruction *From, Value *To)
Returns true if replacing From with To everywhere is guaranteed to preserve LCSSA form.
Definition LoopInfo.h:441

llvm::LoopInfo::erase
LLVM_ABI void erase(Loop *L)
Update LoopInfo after removing the last backedge from a loop.
Definition LoopInfo.cpp:887

llvm::Loop
Represents a single loop in the control flow graph.
Definition LoopInfo.h:40

llvm::Loop::setLoopID
void setLoopID(MDNode *LoopID) const
Set the llvm.loop loop id metadata for this loop.
Definition LoopInfo.cpp:526

llvm::Loop::getLoopID
MDNode * getLoopID() const
Return the llvm.loop loop id metadata node for this loop if it is present.
Definition LoopInfo.cpp:502

llvm::MDBuilder
Definition MDBuilder.h:37

llvm::MDBuilder::createBranchWeights
LLVM_ABI MDNode * createBranchWeights(uint32_t TrueWeight, uint32_t FalseWeight, bool IsExpected=false)
Return metadata containing two branch weights.
Definition MDBuilder.cpp:38

llvm::MDNode
Metadata node.
Definition Metadata.h:1077

llvm::MDNode::replaceOperandWith
LLVM_ABI void replaceOperandWith(unsigned I, Metadata *New)
Replace a specific operand.
Definition Metadata.cpp:1078

llvm::MDNode::getOperand
const MDOperand & getOperand(unsigned I) const
Definition Metadata.h:1445

llvm::MDNode::operands
ArrayRef< MDOperand > operands() const
Definition Metadata.h:1443

llvm::MDNode::get
static MDTuple * get(LLVMContext &Context, ArrayRef< Metadata * > MDs)
Definition Metadata.h:1565

llvm::MDNode::getNumOperands
unsigned getNumOperands() const
Return number of MDNode operands.
Definition Metadata.h:1451

llvm::MDNode::getContext
LLVMContext & getContext() const
Definition Metadata.h:1241

llvm::MDOperand
Tracking metadata reference owned by Metadata.
Definition Metadata.h:899

llvm::MDString
A single uniqued string.
Definition Metadata.h:720

llvm::MDString::getString
LLVM_ABI StringRef getString() const
Definition Metadata.cpp:617

llvm::MDString::get
static LLVM_ABI MDString * get(LLVMContext &Context, StringRef Str)
Definition Metadata.cpp:607

llvm::MDTuple
Tuple of metadata.
Definition Metadata.h:1493

llvm::MemoryAccess
Definition MemorySSA.h:143

llvm::MemoryAccess::getBlock
BasicBlock * getBlock() const
Definition MemorySSA.h:162

llvm::MemoryLocation
Representation for a specific memory location.
Definition MemoryLocation.h:216

llvm::MemoryLocation::get
static LLVM_ABI MemoryLocation get(const LoadInst *LI)
Return a location with information about the memory reference by the given instruction.
Definition MemoryLocation.cpp:36

llvm::MemorySSAUpdater
Definition MemorySSAUpdater.h:55

llvm::MemorySSAWrapperPass
Legacy analysis pass which computes MemorySSA.
Definition MemorySSA.h:993

llvm::MemorySSA
Encapsulates MemorySSA, including all data associated with memory accesses.
Definition MemorySSA.h:702

llvm::MemorySSA::verifyMemorySSA
LLVM_ABI void verifyMemorySSA(VerificationLevel=VerificationLevel::Fast) const
Verify that MemorySSA is self consistent (IE definitions dominate all uses, uses appear in the right ...
Definition MemorySSA.cpp:1905

llvm::MemorySSA::getMemoryAccess
MemoryUseOrDef * getMemoryAccess(const Instruction *I) const
Given a memory Mod/Ref'ing instruction, get the MemorySSA access associated with it.
Definition MemorySSA.h:720

llvm::Metadata
Root of the metadata hierarchy.
Definition Metadata.h:63

llvm::PHINode
Definition Instructions.h:2638

llvm::PHINode::setIncomingValue
void setIncomingValue(unsigned i, Value *V)
Definition Instructions.h:2716

llvm::PHINode::getIncomingBlock
BasicBlock * getIncomingBlock(unsigned i) const
Return incoming basic block number i.
Definition Instructions.h:2733

llvm::PHINode::getIncomingValue
Value * getIncomingValue(unsigned i) const
Return incoming value number x.
Definition Instructions.h:2713

llvm::PHINode::getBasicBlockIndex
int getBasicBlockIndex(const BasicBlock *BB) const
Return the first index of the specified basic block in the value list for this PHI.
Definition Instructions.h:2807

llvm::PHINode::getNumIncomingValues
unsigned getNumIncomingValues() const
Return the number of incoming edges.
Definition Instructions.h:2709

llvm::PassRegistry
PassRegistry - This class manages the registration and initialization of the pass subsystem as appli...
Definition PassRegistry.h:38

llvm::PointerType::get
static LLVM_ABI PointerType * get(Type *ElementType, unsigned AddressSpace)
This constructs a pointer to an object of the specified type in a numbered address space.

llvm::PoisonValue::get
static LLVM_ABI PoisonValue * get(Type *T)
Static factory methods - Return a 'poison' object of the specified type.
Definition Constants.cpp:1885

llvm::PriorityWorklist::insert
bool insert(const T &X)
Insert a new element into the PriorityWorklist.
Definition PriorityWorklist.h:90

llvm::RecurrenceDescriptor::isSignedRecurrenceKind
static bool isSignedRecurrenceKind(RecurKind Kind)
Returns true if the recurrence kind is a signed redux kind.
Definition IVDescriptors.h:288

llvm::RecurrenceDescriptor::isAnyOfRecurrenceKind
static bool isAnyOfRecurrenceKind(RecurKind Kind)
Returns true if the recurrence kind is of the form select(cmp(),x,y) where one of (x,...
Definition IVDescriptors.h:269

llvm::RecurrenceDescriptor::isFindLastIVRecurrenceKind
static bool isFindLastIVRecurrenceKind(RecurKind Kind)
Returns true if the recurrence kind is of the form select(cmp(),x,y) where one of (x,...
Definition IVDescriptors.h:282

llvm::RecurrenceDescriptor::isFindIVRecurrenceKind
static bool isFindIVRecurrenceKind(RecurKind Kind)
Returns true if the recurrence kind is of the form select(cmp(),x,y) where one of (x,...
Definition IVDescriptors.h:297

llvm::RecurrenceDescriptor::isMinMaxRecurrenceKind
static bool isMinMaxRecurrenceKind(RecurKind Kind)
Returns true if the recurrence kind is any min/max kind.
Definition IVDescriptors.h:263

llvm::Registry
A global registry used in conjunction with static constructors to make pluggable components (like tar...
Definition Registry.h:44

llvm::SCEVAAWrapperPass
Legacy wrapper pass to provide the SCEVAAResult object.
Definition ScalarEvolutionAliasAnalysis.h:58

llvm::SCEVExpander
This class uses information about analyzed scalars to rewrite expressions in canonical form.
Definition ScalarEvolutionExpander.h:64

llvm::SCEVExpander::getSE
ScalarEvolution * getSE()
Definition ScalarEvolutionExpander.h:221

llvm::SCEVExpander::expandCodeFor
LLVM_ABI Value * expandCodeFor(const SCEV *SH, Type *Ty, BasicBlock::iterator I)
Insert code to directly compute the specified SCEV expression into the program.
Definition ScalarEvolutionExpander.cpp:1511

llvm::SCEVExpander::eraseDeadInstructions
void eraseDeadInstructions(Value *Root)
Remove inserted instructions that are dead, e.g.
Definition ScalarEvolutionExpander.cpp:179

llvm::SCEV
This class represents an analyzed expression in the program.
Definition ScalarEvolution.h:72

llvm::SCEV::getType
LLVM_ABI Type * getType() const
Return the LLVM type of this SCEV expression.
Definition ScalarEvolution.cpp:383

llvm::ScalarEvolutionWrapperPass
Definition ScalarEvolution.h:2392

llvm::ScalarEvolution
The main scalar evolution driver.
Definition ScalarEvolution.h:448

llvm::ScalarEvolution::isKnownNonNegative
LLVM_ABI bool isKnownNonNegative(const SCEV *S)
Test if the given expression is known to be non-negative.
Definition ScalarEvolution.cpp:10991

llvm::ScalarEvolution::isLoopEntryGuardedByCond
LLVM_ABI bool isLoopEntryGuardedByCond(const Loop *L, CmpPredicate Pred, const SCEV *LHS, const SCEV *RHS)
Test whether entry to the loop is protected by a conditional between LHS and RHS.
Definition ScalarEvolution.cpp:11801

llvm::ScalarEvolution::getSCEVAtScope
LLVM_ABI const SCEV * getSCEVAtScope(const SCEV *S, const Loop *L)
Return a SCEV expression for the specified value at the specified scope in the program.
Definition ScalarEvolution.cpp:9885

llvm::ScalarEvolution::getZero
const SCEV * getZero(Type *Ty)
Return a SCEV for the constant 0 of a specific type.
Definition ScalarEvolution.h:663

llvm::ScalarEvolution::getConstant
LLVM_ABI const SCEV * getConstant(ConstantInt *V)
Definition ScalarEvolution.cpp:470

llvm::ScalarEvolution::getSCEV
LLVM_ABI const SCEV * getSCEV(Value *V)
Return a SCEV expression for the full generality of the specified expression.
Definition ScalarEvolution.cpp:4580

llvm::ScalarEvolution::forgetLoop
LLVM_ABI void forgetLoop(const Loop *L)
This method should be called by the client when it has changed a loop in a way that may affect Scalar...
Definition ScalarEvolution.cpp:8527

llvm::ScalarEvolution::isLoopInvariant
LLVM_ABI bool isLoopInvariant(const SCEV *S, const Loop *L)
Return true if the value of the given SCEV is unchanging in the specified loop.
Definition ScalarEvolution.cpp:14176

llvm::ScalarEvolution::getLoopDisposition
LLVM_ABI LoopDisposition getLoopDisposition(const SCEV *S, const Loop *L)
Return the "disposition" of the given SCEV with respect to the given loop.
Definition ScalarEvolution.cpp:14086

llvm::ScalarEvolution::isSCEVable
LLVM_ABI bool isSCEVable(Type *Ty) const
Test if values of the given type are analyzable within the SCEV framework.
Definition ScalarEvolution.cpp:4474

llvm::ScalarEvolution::forgetValue
LLVM_ABI void forgetValue(Value *V)
This method should be called by the client when it has changed a value in a way that may affect its v...
Definition ScalarEvolution.cpp:8571

llvm::ScalarEvolution::forgetBlockAndLoopDispositions
LLVM_ABI void forgetBlockAndLoopDispositions(Value *V=nullptr)
Called when the client has changed the disposition of values in a loop or block.
Definition ScalarEvolution.cpp:8626

llvm::ScalarEvolution::LoopDisposition
LoopDisposition
An enum describing the relationship between a SCEV and a loop.
Definition ScalarEvolution.h:453

llvm::ScalarEvolution::LoopInvariant
@ LoopInvariant
The SCEV is loop-invariant.
Definition ScalarEvolution.h:455

llvm::ScalarEvolution::isAvailableAtLoopEntry
LLVM_ABI bool isAvailableAtLoopEntry(const SCEV *S, const Loop *L)
Determine if the SCEV can be evaluated at loop's entry.
Definition ScalarEvolution.cpp:2510

llvm::ScalarEvolution::getExitCount
LLVM_ABI const SCEV * getExitCount(const Loop *L, const BasicBlock *ExitingBlock, ExitCountKind Kind=Exact)
Return the number of times the backedge executes before the given exit would be taken; if not exactly...
Definition ScalarEvolution.cpp:8345

llvm::ScalarEvolution::applyLoopGuards
LLVM_ABI const SCEV * applyLoopGuards(const SCEV *Expr, const Loop *L)
Try to apply information from loop guards for L to Expr.
Definition ScalarEvolution.cpp:16078

llvm::SelectInst
This class represents the LLVM 'select' instruction.
Definition Instructions.h:1689

llvm::SmallDenseSet
Implements a dense probed hash-table based set with some number of buckets stored inline.
Definition DenseSet.h:281

llvm::SmallPriorityWorklist
A version of PriorityWorklist that selects small size optimized data structures for the vector and ma...
Definition PriorityWorklist.h:238

llvm::SmallPtrSetImplBase::size
size_type size() const
Definition SmallPtrSet.h:99

llvm::SmallPtrSetImpl::insert
std::pair< iterator, bool > insert(PtrType Ptr)
Inserts Ptr if and only if there is no element in the container equal to Ptr.
Definition SmallPtrSet.h:401

llvm::SmallPtrSetImpl::contains
bool contains(ConstPtrType Ptr) const
Definition SmallPtrSet.h:476

llvm::SmallPtrSet
SmallPtrSet - This class implements a set which is optimized for holding SmallSize or fewer elements.
Definition SmallPtrSet.h:541

llvm::SmallSetVector
A SetVector that performs no allocations if smaller than a certain size.
Definition SetVector.h:356

llvm::SmallVectorImpl
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
Definition SmallVector.h:574

llvm::SmallVectorImpl::pop_back_val
T pop_back_val()
Definition SmallVector.h:674

llvm::SmallVectorImpl::emplace_back
reference emplace_back(ArgTypes &&... Args)
Definition SmallVector.h:938

llvm::SmallVectorImpl::append
void append(ItTy in_start, ItTy in_end)
Add the specified range to the end of the SmallVector.
Definition SmallVector.h:684

llvm::SmallVectorImpl::clear
void clear()
Definition SmallVector.h:611

llvm::SmallVectorTemplateBase::push_back
void push_back(const T &Elt)
Definition SmallVector.h:414

llvm::SmallVectorTemplateCommon::size
size_t size() const
Definition SmallVector.h:79

llvm::SmallVectorTemplateCommon::empty
bool empty() const
Definition SmallVector.h:82

llvm::SmallVector
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition SmallVector.h:1197

llvm::StringRef
StringRef - Represent a constant reference to a string, i.e.
Definition StringRef.h:55

llvm::StringRef::starts_with
bool starts_with(StringRef Prefix) const
Check if this string starts with the given Prefix.
Definition StringRef.h:269

llvm::TargetLibraryInfo
Provides information about what library functions are available for the current target.
Definition TargetLibraryInfo.h:285

llvm::TargetTransformInfo
This pass provides access to the codegen interfaces that are needed for IR-level transformations.
Definition TargetTransformInfo.h:219

llvm::TargetTransformInfo::ReductionShuffle
ReductionShuffle
Definition TargetTransformInfo.h:1858

llvm::TargetTransformInfo::ReductionShuffle::Pairwise
@ Pairwise
Definition TargetTransformInfo.h:1858

llvm::TrackingVH
Value handle that tracks a Value across RAUW.
Definition ValueHandle.h:332

llvm::Type
The instances of the Type class are immutable: once they are created, they are never changed.
Definition Type.h:45

llvm::Type::isVectorTy
bool isVectorTy() const
True if this is an instance of VectorType.
Definition Type.h:273

llvm::Type::getInt32Ty
static LLVM_ABI IntegerType * getInt32Ty(LLVMContext &C)
Definition Type.cpp:297

llvm::Type::isIntegerTy
bool isIntegerTy() const
True if this is an instance of IntegerType.
Definition Type.h:240

llvm::Use
A Use represents the edge between a Value definition and its users.
Definition Use.h:35

llvm::User
Definition User.h:44

llvm::VPIntrinsic::getForIntrinsic
static LLVM_ABI Intrinsic::ID getForIntrinsic(Intrinsic::ID Id)
The llvm.vp.
Definition IntrinsicInst.cpp:593

llvm::VPReductionIntrinsic::isVPReduction
static LLVM_ABI bool isVPReduction(Intrinsic::ID ID)
Definition IntrinsicInst.cpp:708

llvm::Value
LLVM Value Representation.
Definition Value.h:75

llvm::Value::getType
Type * getType() const
All values are typed, get the type of this value.
Definition Value.h:256

llvm::Value::replaceAllUsesWith
LLVM_ABI void replaceAllUsesWith(Value *V)
Change all uses of this to point to a new Value.
Definition Value.cpp:546

llvm::Value::users
iterator_range< user_iterator > users()
Definition Value.h:426

llvm::Value::use_empty
bool use_empty() const
Definition Value.h:346

llvm::Value::getContext
LLVM_ABI LLVMContext & getContext() const
All values hold a context through their type.
Definition Value.cpp:1101

llvm::Value::uses
iterator_range< use_iterator > uses()
Definition Value.h:380

llvm::Value::getName
LLVM_ABI StringRef getName() const
Return a constant reference to the value's name.
Definition Value.cpp:322

llvm::detail::DenseSetImpl::insert
std::pair< iterator, bool > insert(const ValueT &V)
Definition DenseSet.h:194

llvm::function_ref
An efficient, type-erasing, non-owning reference to a callable.
Definition STLFunctionalExtras.h:37

llvm::ilist_detail::node_parent_access::getParent
const ParentTy * getParent() const
Definition ilist_node.h:34

llvm::raw_ostream
This class implements an extremely fast bulk output stream that can only output to a stream.
Definition raw_ostream.h:53

uint64_t

Changed
Changed
Definition ObjCARCOpts.cpp:2370

llvm_unreachable
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
Definition ErrorHandling.h:164

llvm::AA
Abstract Attribute helper functions.
Definition Attributor.h:165

llvm::CallingConv::ID
unsigned ID
LLVM IR allows to use arbitrary numbers as calling convention identifiers.
Definition CallingConv.h:24

llvm::Intrinsic::not_intrinsic
@ not_intrinsic
Definition Intrinsics.h:46

llvm::Intrinsic::ID
unsigned ID
Definition GenericSSAContext.h:28

llvm::Loc
Definition DwarfDebug.h:129

llvm::PatternMatch
Definition PatternMatch.h:47

llvm::SI
Definition SIInstrInfo.h:1720

llvm::mdconst::extract_or_null
std::enable_if_t< detail::IsValidPointer< X, Y >::value, X * > extract_or_null(Y &&MD)
Extract a Value from Metadata, allowing null.
Definition Metadata.h:681

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition AddressRanges.h:18

llvm::drop_begin
auto drop_begin(T &&RangeOrContainer, size_t N=1)
Return a range covering RangeOrContainer with the first N elements excluded.
Definition STLExtras.h:310

llvm::createSimpleReduction
LLVM_ABI Value * createSimpleReduction(IRBuilderBase &B, Value *Src, RecurKind RdxKind)
Create a reduction of the given vector.
Definition LoopUtils.cpp:1397

llvm::getOptionalElementCountLoopAttribute
LLVM_ABI std::optional< ElementCount > getOptionalElementCountLoopAttribute(const Loop *TheLoop)
Find a combination of metadata ("llvm.loop.vectorize.width" and "llvm.loop.vectorize....
Definition LoopUtils.cpp:251

llvm::ThreadPriority::Low
@ Low
Lower the current thread's priority such that it does not affect foreground tasks significantly.
Definition Threading.h:262

llvm::addRuntimeChecks
LLVM_ABI Value * addRuntimeChecks(Instruction *Loc, Loop *TheLoop, const SmallVectorImpl< RuntimePointerCheck > &PointerChecks, SCEVExpander &Expander, bool HoistRuntimeChecks=false)
Add code that checks at runtime if the accessed arrays in PointerChecks overlap.
Definition LoopUtils.cpp:2064

llvm::createFindLastIVReduction
LLVM_ABI Value * createFindLastIVReduction(IRBuilderBase &B, Value *Src, RecurKind RdxKind, Value *Start, Value *Sentinel)
Create a reduction of the given vector Src for a reduction of the kind RecurKind::FindLastIV.
Definition LoopUtils.cpp:1331

llvm::find
auto find(R &&Range, const T &Val)
Provide wrappers to std::find which take ranges instead of having to pass begin/end explicitly.
Definition STLExtras.h:1733

llvm::fill
void fill(R &&Range, T &&Value)
Provide wrappers to std::fill which take ranges instead of having to pass begin/end explicitly.
Definition STLExtras.h:1727

llvm::getLoopEstimatedTripCount
LLVM_ABI std::optional< unsigned > getLoopEstimatedTripCount(Loop *L, unsigned *EstimatedLoopInvocationWeight=nullptr)
Return either:
Definition LoopUtils.cpp:869

llvm::all_of
bool all_of(R &&range, UnaryPredicate P)
Provide wrappers to std::all_of which take ranges instead of having to pass begin/end explicitly.
Definition STLExtras.h:1707

llvm::PseudoProbeType::Block
@ Block
Definition PseudoProbe.h:30

llvm::getMinMaxReductionIntrinsicOp
LLVM_ABI Intrinsic::ID getMinMaxReductionIntrinsicOp(Intrinsic::ID RdxID)
Returns the min/max intrinsic used when expanding a min/max reduction.
Definition LoopUtils.cpp:1107

llvm::getBooleanLoopAttribute
LLVM_ABI bool getBooleanLoopAttribute(const Loop *TheLoop, StringRef Name)
Returns true if Name is applied to TheLoop and enabled.
Definition LoopInfo.cpp:1109

llvm::RuntimePointerCheck
std::pair< const RuntimeCheckingPtrGroup *, const RuntimeCheckingPtrGroup * > RuntimePointerCheck
A memcheck which is made up of a pair of grouped pointers.
Definition LoopAccessAnalysis.h:487

llvm::make_scope_exit
detail::scope_exit< std::decay_t< Callable > > make_scope_exit(Callable &&F)
Definition ScopeExit.h:59

llvm::isKnownNonPositiveInLoop
LLVM_ABI bool isKnownNonPositiveInLoop(const SCEV *S, const Loop *L, ScalarEvolution &SE)
Returns true if we can prove that S is defined and always non-positive in loop L.
Definition LoopUtils.cpp:1518

llvm::getOptionalBoolLoopAttribute
LLVM_ABI std::optional< bool > getOptionalBoolLoopAttribute(const Loop *TheLoop, StringRef Name)
Definition LoopInfo.cpp:1091

llvm::dyn_cast
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:649

llvm::appendReversedLoopsToWorklist
void appendReversedLoopsToWorklist(RangeT &&, SmallPriorityWorklist< Loop *, 4 > &)
Utility that implements appending of loops onto a worklist given a range.
Definition LoopUtils.cpp:1898

llvm::AlignStyle::Right
@ Right
Definition FormatCommon.h:17

llvm::AlignStyle::Left
@ Left
Definition FormatCommon.h:17

llvm::successors
auto successors(const MachineBasicBlock *BB)
Definition MachineBasicBlock.h:1421

llvm::initializeLoopPassPass
LLVM_ABI void initializeLoopPassPass(PassRegistry &)
Manually defined generic "LoopPass" dependency initialization.
Definition LoopUtils.cpp:190

llvm::from_range
constexpr from_range_t from_range
Definition STLForwardCompat.h:99

llvm::formLCSSARecursively
LLVM_ABI bool formLCSSARecursively(Loop &L, const DominatorTree &DT, const LoopInfo *LI, ScalarEvolution *SE)
Put a loop nest into LCSSA form.
Definition LCSSA.cpp:449

llvm::getReductionIdentity
LLVM_ABI Value * getReductionIdentity(Intrinsic::ID RdxID, Type *Ty, FastMathFlags FMF)
Given information about an @llvm.vector.reduce.
Definition LoopUtils.cpp:1347

llvm::makeFollowupLoopID
LLVM_ABI std::optional< MDNode * > makeFollowupLoopID(MDNode *OrigLoopID, ArrayRef< StringRef > FollowupAttrs, const char *InheritOptionsAttrsPrefix="", bool AlwaysNew=false)
Create a new loop identifier for a loop created from a loop transformation.
Definition LoopUtils.cpp:264

llvm::getArithmeticReductionInstruction
LLVM_ABI unsigned getArithmeticReductionInstruction(Intrinsic::ID RdxID)
Returns the arithmetic instruction opcode used when expanding a reduction.
Definition LoopUtils.cpp:1059

llvm::make_early_inc_range
iterator_range< early_inc_iterator_impl< detail::IterOfRange< RangeT > > > make_early_inc_range(RangeT &&Range)
Make a range that does early increment to allow mutation of the underlying range without disrupting i...
Definition STLExtras.h:626

llvm::LCSSAID
LLVM_ABI char & LCSSAID
Definition LCSSA.cpp:526

llvm::LoopSimplifyID
LLVM_ABI char & LoopSimplifyID
Definition LoopSimplify.cpp:784

llvm::createMinMaxOp
LLVM_ABI Value * createMinMaxOp(IRBuilderBase &Builder, RecurKind RK, Value *Left, Value *Right)
Returns a Min/Max operation corresponding to MinMaxRecurrenceKind.
Definition LoopUtils.cpp:1200

llvm::collectChildrenInLoop
LLVM_ABI SmallVector< BasicBlock *, 16 > collectChildrenInLoop(DominatorTree *DT, DomTreeNode *N, const Loop *CurLoop)
Does a BFS from a given node to all of its children inside a given loop.
Definition LoopUtils.cpp:450

llvm::addStringMetadataToLoop
LLVM_ABI void addStringMetadataToLoop(Loop *TheLoop, const char *MDString, unsigned V=0)
Set input string into loop metadata by keeping other values intact.
Definition LoopUtils.cpp:215

llvm::cannotBeMaxInLoop
LLVM_ABI bool cannotBeMaxInLoop(const SCEV *S, const Loop *L, ScalarEvolution &SE, bool Signed)
Returns true if S is defined and is never equal to signed/unsigned max.
Definition LoopUtils.cpp:1536

llvm::DomTreeNode
DomTreeNodeBase< BasicBlock > DomTreeNode
Definition Dominators.h:95

llvm::divideNearest
constexpr T divideNearest(U Numerator, V Denominator)
Returns (Numerator / Denominator) rounded by round-half-up.
Definition MathExtras.h:469

llvm::hasVectorizeTransformation
LLVM_ABI TransformationMode hasVectorizeTransformation(const Loop *L)
Definition LoopUtils.cpp:392

llvm::dyn_cast_or_null
auto dyn_cast_or_null(const Y &Val)
Definition Casting.h:759

llvm::transform
OutputIt transform(R &&Range, OutputIt d_first, UnaryFunction F)
Wrapper function around std::transform to apply a function to a range and store the result elsewhere.
Definition STLExtras.h:1950

llvm::any_of
bool any_of(R &&range, UnaryPredicate P)
Provide wrappers to std::any_of which take ranges instead of having to pass begin/end explicitly.
Definition STLExtras.h:1714

llvm::isInstructionTriviallyDead
LLVM_ABI bool isInstructionTriviallyDead(Instruction *I, const TargetLibraryInfo *TLI=nullptr)
Return true if the result produced by the instruction is not used, and the instruction will return.
Definition Local.cpp:402

llvm::findDefsUsedOutsideOfLoop
LLVM_ABI SmallVector< Instruction *, 8 > findDefsUsedOutsideOfLoop(Loop *L)
Returns the instructions that use values defined in the loop.
Definition LoopUtils.cpp:124

llvm::reverse
auto reverse(ContainerTy &&C)
Definition STLExtras.h:400

llvm::getReductionIntrinsicID
LLVM_ABI constexpr Intrinsic::ID getReductionIntrinsicID(RecurKind RK)
Returns the llvm.vector.reduce intrinsic that corresponds to the recurrence kind.
Definition LoopUtils.cpp:997

llvm::isMustProgress
LLVM_ABI bool isMustProgress(const Loop *L)
Return true if this loop can be assumed to make progress.
Definition LoopInfo.cpp:1162

llvm::isPowerOf2_32
constexpr bool isPowerOf2_32(uint32_t Value)
Return true if the argument is a power of two > 0.
Definition MathExtras.h:288

llvm::isModSet
bool isModSet(const ModRefInfo MRI)
Definition ModRef.h:49

llvm::hasUnrollAndJamTransformation
LLVM_ABI TransformationMode hasUnrollAndJamTransformation(const Loop *L)
Definition LoopUtils.cpp:374

llvm::deleteDeadLoop
LLVM_ABI void deleteDeadLoop(Loop *L, DominatorTree *DT, ScalarEvolution *SE, LoopInfo *LI, MemorySSA *MSSA=nullptr)
This function deletes dead loops.
Definition LoopUtils.cpp:485

llvm::dbgs
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
Definition Debug.cpp:207

llvm::hasDisableAllTransformsHint
LLVM_ABI bool hasDisableAllTransformsHint(const Loop *L)
Look for the loop attribute that disables all transformation heuristic.
Definition LoopUtils.cpp:345

llvm::appendLoopsToWorklist
LLVM_TEMPLATE_ABI void appendLoopsToWorklist(RangeT &&, SmallPriorityWorklist< Loop *, 4 > &)
Utility that implements appending of loops onto a worklist given a range.

llvm::SCEVCheapExpansionBudget
LLVM_ABI cl::opt< unsigned > SCEVCheapExpansionBudget

llvm::Count
FunctionAddr VTableAddr Count
Definition InstrProf.h:139

llvm::getShuffleReduction
LLVM_ABI Value * getShuffleReduction(IRBuilderBase &Builder, Value *Src, unsigned Op, TargetTransformInfo::ReductionShuffle RS, RecurKind MinMaxKind=RecurKind::None)
Generates a vector reduction using shufflevectors to reduce the value.
Definition LoopUtils.cpp:1243

llvm::hasUnrollTransformation
LLVM_ABI TransformationMode hasUnrollTransformation(const Loop *L)
Definition LoopUtils.cpp:353

llvm::hasDistributeTransformation
LLVM_ABI TransformationMode hasDistributeTransformation(const Loop *L)
Definition LoopUtils.cpp:428

llvm::breakLoopBackedge
LLVM_ABI void breakLoopBackedge(Loop *L, DominatorTree &DT, ScalarEvolution &SE, LoopInfo &LI, MemorySSA *MSSA)
Remove the backedge of the specified loop.
Definition LoopUtils.cpp:711

llvm::isa
bool isa(const From &Val)
isa<X> - Return true if the parameter to the template is an instance of one of the template type argu...
Definition Casting.h:548

llvm::getLoopAnalysisUsage
LLVM_ABI void getLoopAnalysisUsage(AnalysisUsage &AU)
Helper to consistently add the set of standard passes to a loop pass's AnalysisUsage.
Definition LoopUtils.cpp:142

llvm::propagateIRFlags
LLVM_ABI void propagateIRFlags(Value *I, ArrayRef< Value * > VL, Value *OpValue=nullptr, bool IncludeWrapFlags=true)
Get the intersection (logical and) of all of the potential IR flags of each scalar operation (VL) tha...
Definition LoopUtils.cpp:1477

llvm::isKnownPositiveInLoop
LLVM_ABI bool isKnownPositiveInLoop(const SCEV *S, const Loop *L, ScalarEvolution &SE)
Returns true if we can prove that S is defined and always positive in loop L.
Definition LoopUtils.cpp:1511

llvm::Key
LLVM_ATTRIBUTE_VISIBILITY_DEFAULT AnalysisKey InnerAnalysisManagerProxy< AnalysisManagerT, IRUnitT, ExtraArgTs... >::Key
Definition PassManager.h:668

llvm::changeToUnreachable
LLVM_ABI unsigned changeToUnreachable(Instruction *I, bool PreserveLCSSA=false, DomTreeUpdater *DTU=nullptr, MemorySSAUpdater *MSSAU=nullptr)
Insert an unreachable instruction before the specified instruction, making it and the rest of the cod...
Definition Local.cpp:2513

llvm::succ_begin
RNSuccIterator< NodeRef, BlockT, RegionT > succ_begin(NodeRef Node)
Definition RegionIterator.h:249

llvm::getOptionalIntLoopAttribute
LLVM_ABI std::optional< int > getOptionalIntLoopAttribute(const Loop *TheLoop, StringRef Name)
Find named metadata for a loop with an integer value.
Definition LoopInfo.cpp:1113

llvm::SplitBlockPredecessors
LLVM_ABI BasicBlock * SplitBlockPredecessors(BasicBlock *BB, ArrayRef< BasicBlock * > Preds, const char *Suffix, DominatorTree *DT, LoopInfo *LI=nullptr, MemorySSAUpdater *MSSAU=nullptr, bool PreserveLCSSA=false)
This method introduces at least one new basic block into the function and moves some of the predecess...
Definition BasicBlockUtils.cpp:1297

llvm::IRMemLocation::First
@ First
Helpers to iterate all locations in the MemoryEffectsBase class.
Definition ModRef.h:71

llvm::TTI
TargetTransformInfo TTI
Definition TargetTransformInfo.h:214

llvm::getMinMaxReductionPredicate
LLVM_ABI CmpInst::Predicate getMinMaxReductionPredicate(RecurKind RK)
Returns the comparison predicate used when expanding a min/max reduction.
Definition LoopUtils.cpp:1178

llvm::hasLICMVersioningTransformation
LLVM_ABI TransformationMode hasLICMVersioningTransformation(const Loop *L)
Definition LoopUtils.cpp:438

llvm::VerifyMemorySSA
LLVM_ABI bool VerifyMemorySSA
Enables verification of MemorySSA.
Definition MemorySSA.cpp:84

llvm::TransformationMode
TransformationMode
The mode sets how eager a transformation should be applied.
Definition LoopUtils.h:284

llvm::TM_Unspecified
@ TM_Unspecified
The pass can use heuristics to determine whether a transformation should be applied.
Definition LoopUtils.h:287

llvm::TM_SuppressedByUser
@ TM_SuppressedByUser
The transformation must not be applied.
Definition LoopUtils.h:307

llvm::TM_ForcedByUser
@ TM_ForcedByUser
The transformation was directed by the user, e.g.
Definition LoopUtils.h:301

llvm::TM_Disable
@ TM_Disable
The transformation should not be applied.
Definition LoopUtils.h:293

llvm::TM_Enable
@ TM_Enable
The transformation should be applied without considering a cost model.
Definition LoopUtils.h:290

llvm::succ_end
RNSuccIterator< NodeRef, BlockT, RegionT > succ_end(NodeRef Node)
Definition RegionIterator.h:254

llvm::hasDisableLICMTransformsHint
LLVM_ABI bool hasDisableLICMTransformsHint(const Loop *L)
Look for the loop attribute that disables the LICM transformation heuristics.
Definition LoopUtils.cpp:349

llvm::appendLoopsToWorklist< Loop & >
template LLVM_TEMPLATE_ABI void appendLoopsToWorklist< Loop & >(Loop &L, SmallPriorityWorklist< Loop *, 4 > &Worklist)

llvm::LEB128Sign::Signed
@ Signed
Definition LEB128.h:234

llvm::getReductionForBinop
LLVM_ABI Intrinsic::ID getReductionForBinop(Instruction::BinaryOps Opc)
Returns the reduction intrinsic id corresponding to the binary operation.
Definition LoopUtils.cpp:1089

llvm::RecurKind
RecurKind
These are the kinds of recurrences that we support.
Definition IVDescriptors.h:34

llvm::RecurKind::UMin
@ UMin
Unsigned integer min implemented in terms of select(cmp()).
Definition IVDescriptors.h:46

llvm::RecurKind::FMinimumNum
@ FMinimumNum
FP min with llvm.minimumnum semantics.
Definition IVDescriptors.h:56

llvm::RecurKind::Or
@ Or
Bitwise or logical OR of integers.
Definition IVDescriptors.h:41

llvm::RecurKind::FMinimum
@ FMinimum
FP min with llvm.minimum semantics.
Definition IVDescriptors.h:54

llvm::RecurKind::FMaxNum
@ FMaxNum
FP max with llvm.maxnum semantics including NaNs.
Definition IVDescriptors.h:53

llvm::RecurKind::Mul
@ Mul
Product of integers.
Definition IVDescriptors.h:40

llvm::RecurKind::None
@ None
Not a recurrence.
Definition IVDescriptors.h:36

llvm::RecurKind::AnyOf
@ AnyOf
AnyOf reduction with select(cmp(),x,y) where one of (x,y) is loop invariant, and both x and y are int...
Definition IVDescriptors.h:59

llvm::RecurKind::Xor
@ Xor
Bitwise or logical XOR of integers.
Definition IVDescriptors.h:43

llvm::RecurKind::FMax
@ FMax
FP max implemented in terms of select(cmp()).
Definition IVDescriptors.h:51

llvm::RecurKind::FMaximum
@ FMaximum
FP max with llvm.maximum semantics.
Definition IVDescriptors.h:55

llvm::RecurKind::FMulAdd
@ FMulAdd
Sum of float products with llvm.fmuladd(a * b + sum).
Definition IVDescriptors.h:58

llvm::RecurKind::FMul
@ FMul
Product of floats.
Definition IVDescriptors.h:49

llvm::RecurKind::SMax
@ SMax
Signed integer max implemented in terms of select(cmp()).
Definition IVDescriptors.h:45

llvm::RecurKind::And
@ And
Bitwise or logical AND of integers.
Definition IVDescriptors.h:42

llvm::RecurKind::SMin
@ SMin
Signed integer min implemented in terms of select(cmp()).
Definition IVDescriptors.h:44

llvm::RecurKind::FMin
@ FMin
FP min implemented in terms of select(cmp()).
Definition IVDescriptors.h:50

llvm::RecurKind::FMinNum
@ FMinNum
FP min with llvm.minnum semantics including NaNs.
Definition IVDescriptors.h:52

llvm::RecurKind::Sub
@ Sub
Subtraction of integers.
Definition IVDescriptors.h:38

llvm::RecurKind::Add
@ Add
Sum of integers.
Definition IVDescriptors.h:37

llvm::RecurKind::AddChainWithSubs
@ AddChainWithSubs
A chain of adds and subs.
Definition IVDescriptors.h:39

llvm::RecurKind::FAdd
@ FAdd
Sum of floats.
Definition IVDescriptors.h:48

llvm::RecurKind::FMaximumNum
@ FMaximumNum
FP max with llvm.maximumnum semantics.
Definition IVDescriptors.h:57

llvm::RecurKind::UMax
@ UMax
Unsigned integer max implemented in terms of select(cmp()).
Definition IVDescriptors.h:47

llvm::getRecurrenceIdentity
LLVM_ABI Value * getRecurrenceIdentity(RecurKind K, Type *Tp, FastMathFlags FMF)
Given information about a recurrence kind, return the identity for the @llvm.vector....
Definition LoopUtils.cpp:1389

llvm::setProfileInfoAfterUnrolling
LLVM_ABI void setProfileInfoAfterUnrolling(Loop *OrigLoop, Loop *UnrolledLoop, Loop *RemainderLoop, uint64_t UF)
Set weights for UnrolledLoop and RemainderLoop based on weights for OrigLoop and the following distri...
Definition LoopUtils.cpp:1870

llvm::formDedicatedExitBlocks
LLVM_ABI bool formDedicatedExitBlocks(Loop *L, DominatorTree *DT, LoopInfo *LI, MemorySSAUpdater *MSSAU, bool PreserveLCSSA)
Ensure that all exit blocks of the loop are dedicated exits.
Definition LoopUtils.cpp:58

llvm::Op
DWARFExpression::Operation Op
Definition DWARFExpressionPrinter.cpp:22

llvm::operator<<
raw_ostream & operator<<(raw_ostream &OS, const APFixedPoint &FX)
Definition APFixedPoint.h:312

llvm::isKnownNegativeInLoop
LLVM_ABI bool isKnownNegativeInLoop(const SCEV *S, const Loop *L, ScalarEvolution &SE)
Returns true if we can prove that S is defined and always negative in loop L.
Definition LoopUtils.cpp:1497

llvm::BitWidth
constexpr unsigned BitWidth
Definition BitmaskEnum.h:223

llvm::ValueToValueMapTy
ValueMap< const Value *, WeakTrackingVH > ValueToValueMapTy
Definition MemorySSAUpdater.h:51

llvm::setLoopEstimatedTripCount
LLVM_ABI bool setLoopEstimatedTripCount(Loop *L, unsigned EstimatedTripCount, std::optional< unsigned > EstimatedLoopInvocationWeight=std::nullopt)
Set llvm.loop.estimated_trip_count with the value EstimatedTripCount in the loop metadata of L.
Definition LoopUtils.cpp:927

llvm::extractBranchWeights
LLVM_ABI bool extractBranchWeights(const MDNode *ProfileData, SmallVectorImpl< uint32_t > &Weights)
Extract branch weights from MD_prof metadata.
Definition ProfDataUtils.cpp:180

llvm::LLVMLoopEstimatedTripCount
LLVM_ABI const char * LLVMLoopEstimatedTripCount
Profile-based loop metadata that should be accessed only by using llvm::getLoopEstimatedTripCount and...
Definition ProfDataUtils.cpp:98

llvm::hasIterationCountInvariantInParent
LLVM_ABI bool hasIterationCountInvariantInParent(Loop *L, ScalarEvolution &SE)
Check inner loop (L) backedge count is known to be invariant on all iterations of its outer loop.
Definition LoopUtils.cpp:975

llvm::cast
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:565

llvm::isAlmostDeadIV
LLVM_ABI bool isAlmostDeadIV(PHINode *IV, BasicBlock *LatchBlock, Value *Cond)
Return true if the induction variable IV in a Loop whose latch is LatchBlock would become dead if the...
Definition LoopUtils.cpp:471

llvm::predecessors
auto predecessors(const MachineBasicBlock *BB)
Definition MachineBasicBlock.h:1422

llvm::rewriteLoopExitValues
LLVM_ABI int rewriteLoopExitValues(Loop *L, LoopInfo *LI, TargetLibraryInfo *TLI, ScalarEvolution *SE, const TargetTransformInfo *TTI, SCEVExpander &Rewriter, DominatorTree *DT, ReplaceExitVal ReplaceExitValue, SmallVector< WeakTrackingVH, 16 > &DeadInsts)
If the final value of any expressions that are recurrent in the loop can be computed,...
Definition LoopUtils.cpp:1658

llvm::createOrderedReduction
LLVM_ABI Value * createOrderedReduction(IRBuilderBase &B, RecurKind RdxKind, Value *Src, Value *Start)
Create an ordered reduction intrinsic using the given recurrence kind RdxKind.
Definition LoopUtils.cpp:1450

llvm::addDiffRuntimeChecks
LLVM_ABI Value * addDiffRuntimeChecks(Instruction *Loc, ArrayRef< PointerDiffInfo > Checks, SCEVExpander &Expander, function_ref< Value *(IRBuilderBase &, unsigned)> GetVF, unsigned IC)
Definition LoopUtils.cpp:2123

llvm::getMinMaxReductionRecurKind
LLVM_ABI RecurKind getMinMaxReductionRecurKind(Intrinsic::ID RdxID)
Returns the recurrence kind used when expanding a min/max reduction.
Definition LoopUtils.cpp:1159

llvm::ReplaceExitVal
ReplaceExitVal
Definition LoopUtils.h:516

llvm::UnusedIndVarInLoop
@ UnusedIndVarInLoop
Definition LoopUtils.h:520

llvm::OnlyCheapRepl
@ OnlyCheapRepl
Definition LoopUtils.h:518

llvm::AlwaysRepl
@ AlwaysRepl
Definition LoopUtils.h:521

llvm::SplitEdge
LLVM_ABI BasicBlock * SplitEdge(BasicBlock *From, BasicBlock *To, DominatorTree *DT=nullptr, LoopInfo *LI=nullptr, MemorySSAUpdater *MSSAU=nullptr, const Twine &BBName="")
Split the edge connecting the specified blocks, and return the newly created basic block between From...
Definition BasicBlockUtils.cpp:645

llvm::hasPartialIVCondition
LLVM_ABI std::optional< IVConditionInfo > hasPartialIVCondition(const Loop &L, unsigned MSSAThreshold, const MemorySSA &MSSA, AAResults &AA)
Check if the loop header has a conditional branch that is not loop-invariant, because it involves loa...
Definition LoopUtils.cpp:2170

llvm::filterDbgVars
static auto filterDbgVars(iterator_range< simple_ilist< DbgRecord >::iterator > R)
Filter the DbgRecord range to DbgVariableRecord types only and downcast.
Definition DebugProgramInstruction.h:562

llvm::PseudoProbeAttributes::Sentinel
@ Sentinel
Definition PseudoProbe.h:34

llvm::createAnyOfReduction
LLVM_ABI Value * createAnyOfReduction(IRBuilderBase &B, Value *Src, Value *InitVal, PHINode *OrigPhi)
Create a reduction of the given vector Src for a reduction of kind RecurKind::AnyOf.
Definition LoopUtils.cpp:1301

llvm::cannotBeMinInLoop
LLVM_ABI bool cannotBeMinInLoop(const SCEV *S, const Loop *L, ScalarEvolution &SE, bool Signed)
Returns true if S is defined and is never equal to signed/unsigned min.
Definition LoopUtils.cpp:1525

llvm::isKnownNonNegativeInLoop
LLVM_ABI bool isKnownNonNegativeInLoop(const SCEV *S, const Loop *L, ScalarEvolution &SE)
Returns true if we can prove that S is defined and always non-negative in loop L.
Definition LoopUtils.cpp:1504

llvm::getOrderedReduction
LLVM_ABI Value * getOrderedReduction(IRBuilderBase &Builder, Value *Acc, Value *Src, unsigned Op, RecurKind MinMaxKind=RecurKind::None)
Generates an ordered vector reduction using extracts to reduce the value.
Definition LoopUtils.cpp:1218

llvm::findOptionMDForLoopID
LLVM_ABI MDNode * findOptionMDForLoopID(MDNode *LoopID, StringRef Name)
Find and return the loop attribute node for the attribute Name in LoopID.
Definition LoopInfo.cpp:1041

llvm::getMinMaxReductionIntrinsicID
LLVM_ABI Intrinsic::ID getMinMaxReductionIntrinsicID(Intrinsic::ID IID)
Returns the llvm.vector.reduce min/max intrinsic that corresponds to the intrinsic op.
Definition LoopUtils.cpp:1043

llvm::ColorMode::Enable
@ Enable
Enable colors.
Definition WithColor.h:47

llvm::cloneLoop
LLVM_ABI Loop * cloneLoop(Loop *L, Loop *PL, ValueToValueMapTy &VM, LoopInfo *LI, LPPassManager *LPM)
Recursively clone the specified loop and all of its children, mapping the blocks with the specified m...
Definition LoopUtils.cpp:1941

std::swap
void swap(llvm::BitVector &LHS, llvm::BitVector &RHS)
Implement std::swap in terms of BitVector swap.
Definition BitVector.h:853

N
#define N

DbgLoop
Definition LoopUtils.cpp:807

DbgLoop::DbgLoop
DbgLoop(const Loop *L)
Definition LoopUtils.cpp:809

DbgLoop::L
const Loop * L
Definition LoopUtils.cpp:808

PointerBounds
IR Values for the lower and upper bounds of a pointer evolution.
Definition LoopUtils.cpp:1968

PointerBounds::Start
TrackingVH< Value > Start
Definition LoopUtils.cpp:1969

PointerBounds::End
TrackingVH< Value > End
Definition LoopUtils.cpp:1970

PointerBounds::StrideToCheck
Value * StrideToCheck
Definition LoopUtils.cpp:1971

RewritePhi
Definition LoopUtils.cpp:1577

RewritePhi::HighCost
bool HighCost
Definition LoopUtils.cpp:1582

RewritePhi::Ith
unsigned Ith
Definition LoopUtils.cpp:1579

RewritePhi::RewritePhi
RewritePhi(PHINode *P, unsigned I, const SCEV *Val, Instruction *ExpansionPt, bool H)
Definition LoopUtils.cpp:1584

RewritePhi::ExpansionSCEV
const SCEV * ExpansionSCEV
Definition LoopUtils.cpp:1580

RewritePhi::PN
PHINode * PN
Definition LoopUtils.cpp:1578

RewritePhi::ExpansionPoint
Instruction * ExpansionPoint
Definition LoopUtils.cpp:1581

llvm::IVConditionInfo
Struct to hold information about a partially invariant condition.
Definition LoopUtils.h:605

llvm::Incoming
Incoming for lane mask phi as machine instruction, incoming register Reg and incoming block Block are...
Definition SILowerI1Copies.h:26

llvm::LCSSAVerificationPass
Definition LoopPass.h:125

llvm::RuntimeCheckingPtrGroup
A grouping of pointers.
Definition LoopAccessAnalysis.h:453

llvm::RuntimeCheckingPtrGroup::AddressSpace
unsigned AddressSpace
Address space of the involved pointers.
Definition LoopAccessAnalysis.h:478

llvm::RuntimeCheckingPtrGroup::NeedsFreeze
bool NeedsFreeze
Whether the pointer needs to be frozen after expansion, e.g.
Definition LoopAccessAnalysis.h:481

llvm::RuntimeCheckingPtrGroup::High
const SCEV * High
The SCEV expression which represents the upper bound of all the pointers in this group.
Definition LoopAccessAnalysis.h:471

llvm::RuntimeCheckingPtrGroup::Low
const SCEV * Low
The SCEV expression which represents the lower bound of all the pointers in this group.
Definition LoopAccessAnalysis.h:474

llvm::fltSemantics
Definition APFloat.cpp:103