doxygen/RISCVCodeGenPrepare_8cpp_source.html

//===----- RISCVCodeGenPrepare.cpp ----------------------------------------===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

//

// This is a RISC-V specific version of CodeGenPrepare.

// It munges the code in the input function to better prepare it for

// SelectionDAG-based code generation. This works around limitations in its

// basic-block-at-a-time approach.

//

//===----------------------------------------------------------------------===//


#include "RISCV.h"

#include "RISCVTargetMachine.h"

#include "llvm/ADT/Statistic.h"

#include "llvm/Analysis/ValueTracking.h"

#include "llvm/CodeGen/TargetPassConfig.h"

#include "llvm/IR/Dominators.h"

#include "llvm/IR/IRBuilder.h"

#include "llvm/IR/InstVisitor.h"

#include "llvm/IR/IntrinsicInst.h"

#include "llvm/IR/Intrinsics.h"

#include "llvm/IR/PatternMatch.h"

#include "llvm/InitializePasses.h"

#include "llvm/Pass.h"

#include "llvm/Transforms/Utils/Local.h"


using namespace llvm;


#define DEBUG_TYPE "riscv-codegenprepare"

#define PASS_NAME "RISC-V CodeGenPrepare"


namespace {

/// Per-function worker that applies the RISC-V specific CodeGenPrepare
/// rewrites. Instructions are dispatched through InstVisitor; every hook
/// returns true when it changed the IR.
class RISCVCodeGenPrepare : public InstVisitor<RISCVCodeGenPrepare, bool> {
  Function &F;
  const DataLayout *DL;
  const DominatorTree *DT;
  const RISCVSubtarget *ST;

public:
  RISCVCodeGenPrepare(Function &F, const DominatorTree *DT,
                      const RISCVSubtarget *ST)
      : F(F), DL(&F.getDataLayout()), DT(DT), ST(ST) {}

  /// Visit every instruction of F. Returns true if any visit changed the IR.
  bool run();

  // InstVisitor hooks.
  /// Fallback for instructions without a dedicated hook: nothing to do.
  bool visitInstruction(Instruction &) { return false; }
  bool visitAnd(BinaryOperator &BO);
  bool visitFreezeInst(FreezeInst &I);
  bool visitIntrinsicInst(IntrinsicInst &I);

  // Individual rewrites used by the hooks above.
  bool expandVPStrideLoad(IntrinsicInst &II);
  bool expandMulReduction(IntrinsicInst &II);
  bool widenVPMerge(Instruction *Root);
};

} // namespace


namespace {

/// Legacy pass manager wrapper around RISCVCodeGenPrepare.
class RISCVCodeGenPrepareLegacyPass : public FunctionPass {
public:
  static char ID;

  RISCVCodeGenPrepareLegacyPass() : FunctionPass(ID) {}

  StringRef getPassName() const override { return PASS_NAME; }

  /// The pass needs the dominator tree and the target pass configuration, and
  /// declares that it preserves the CFG.
  void getAnalysisUsage(AnalysisUsage &AU) const override {
    AU.addRequired<DominatorTreeWrapperPass>();
    AU.addRequired<TargetPassConfig>();
    AU.setPreservesCFG();
  }

  bool runOnFunction(Function &F) override;
};

} // namespace


// Try to optimize (i64 (and (zext nneg (i32 X)), C1)) when C1 has bit 31 set
// but bits 63:32 clear. The nneg flag tells us bit 31 of X is 0, so the zero
// extended operand has bits 63:31 clear and we are free to fill the upper 32
// bits of C1 with ones. When the resulting constant is a simm12 the AND can
// then be selected as ANDI.
//
// Returns true if the constant operand of BO was replaced.
bool RISCVCodeGenPrepare::visitAnd(BinaryOperator &BO) {
  using namespace PatternMatch;

  // Only 64-bit ANDs on RV64 are candidates.
  if (!ST->is64Bit() || !BO.getType()->isIntegerTy(64))
    return false;

  // Left hand side should be a zext nneg from i32.
  Value *NarrowSrc;
  if (!match(BO.getOperand(0), m_NNegZExt(m_Value(NarrowSrc))) ||
      !NarrowSrc->getType()->isIntegerTy(32))
    return false;

  // Right hand side should be a constant.
  auto *MaskC = dyn_cast<ConstantInt>(BO.getOperand(1));
  if (!MaskC)
    return false;

  const uint64_t Mask = MaskC->getZExtValue();
  const int64_t SExtMask = SignExtend64<32>(Mask);

  // Look for constants that fit in 32 bits but not simm12, and can be made
  // into simm12 by sign extending bit 31. This will allow use of ANDI.
  // TODO: Is worth making simm32?
  const bool Profitable =
      isUInt<32>(Mask) && !isInt<12>(Mask) && isInt<12>(SExtMask);
  if (!Profitable)
    return false;

  // Install the sign extended constant as the new mask.
  BO.setOperand(1, ConstantInt::get(MaskC->getType(),
                                    static_cast<uint64_t>(SExtMask)));
  return true;
}


// With EVL tail folding, an AnyOf reduction will generate an i1 vp.merge like
// follows:
//
// loop:
//   %phi = phi <vscale x 4 x i1> [zeroinitializer, %entry], [%freeze, %loop]
//   %cmp = icmp ...
//   %rec = call <vscale x 4 x i1> @llvm.vp.merge(%cmp, i1 true, %phi, %evl)
//   %freeze = freeze <vscale x 4 x i1> %rec [optional]
//   ...
// middle:
//   %res = call i1 @llvm.vector.reduce.or(<vscale x 4 x i1> %freeze)
//
// However RVV doesn't have any tail undisturbed mask instructions and so we
// need a convoluted sequence of mask instructions to lower the i1 vp.merge: see
// llvm/test/CodeGen/RISCV/rvv/vpmerge-sdnode.ll.
//
// To avoid that this widens the i1 vp.merge to an i8 vp.merge, which will
// generate a single vmerge.vim:
//
// loop:
//   %phi = phi <vscale x 4 x i8> [zeroinitializer, %entry], [%freeze, %loop]
//   %cmp = icmp ...
//   %rec = call <vscale x 4 x i8> @llvm.vp.merge(%cmp, i8 1, %phi, %evl)
//   %freeze = freeze <vscale x 4 x i8> %rec
//   %trunc = trunc <vscale x 4 x i8> %freeze to <vscale x 4 x i1>
//   ...
// middle:
//   %res = call i1 @llvm.vector.reduce.or(<vscale x 4 x i1> %trunc)
//
// The trunc will normally be sunk outside of the loop, but even if there are
// users inside the loop it is still profitable.
//
// Root is either the vp.merge itself or a freeze of it. Returns true if the
// recurrence was widened, in which case Root and the old chain are deleted.
bool RISCVCodeGenPrepare::widenVPMerge(Instruction *Root) {
  if (!Root->getType()->getScalarType()->isIntegerTy(1))
    return false;

  Value *Mask, *True, *PhiV, *EVL;
  using namespace PatternMatch;
  auto m_VPMerge = m_Intrinsic<Intrinsic::vp_merge>(
      m_Value(Mask), m_Value(True), m_Value(PhiV), m_Value(EVL));
  if (!match(Root, m_CombineOr(m_VPMerge, m_Freeze(m_VPMerge))))
    return false;

  // Only the uses of Root are redirected to the widened chain below. When
  // Root is a freeze, any other user of the underlying vp.merge would keep
  // the old merge (and the old phi) alive after the phi's backedge value has
  // been overwritten, silently changing what that user observes. Require the
  // freeze to be the merge's only user.
  const bool RootIsFreeze = isa<FreezeInst>(Root);
  if (RootIsFreeze && !Root->getOperand(0)->hasOneUse())
    return false;

  // The phi must be a two-entry recurrence that starts at zero, feeds only
  // the merge, and takes Root on its second incoming edge.
  auto *Phi = dyn_cast<PHINode>(PhiV);
  if (!Phi || !Phi->hasOneUse() || Phi->getNumIncomingValues() != 2 ||
      !match(Phi->getIncomingValue(0), m_Zero()) ||
      Phi->getIncomingValue(1) != Root)
    return false;

  Type *WideTy =
      VectorType::get(IntegerType::getInt8Ty(Root->getContext()),
                      cast<VectorType>(Root->getType())->getElementCount());

  // Build the i8 recurrence next to the original one.
  IRBuilder<> Builder(Phi);
  PHINode *WidePhi = Builder.CreatePHI(WideTy, 2);
  WidePhi->addIncoming(ConstantAggregateZero::get(WideTy),
                       Phi->getIncomingBlock(0));
  Builder.SetInsertPoint(Root);
  Value *WideTrue = Builder.CreateZExt(True, WideTy);
  Value *WideMerge = Builder.CreateIntrinsic(Intrinsic::vp_merge, {WideTy},
                                             {Mask, WideTrue, WidePhi, EVL});
  if (RootIsFreeze)
    WideMerge = Builder.CreateFreeze(WideMerge);
  WidePhi->addIncoming(WideMerge, Phi->getIncomingBlock(1));
  Value *Trunc = Builder.CreateTrunc(WideMerge, Root->getType());

  Root->replaceAllUsesWith(Trunc);

  // Break the cycle and delete the old chain.
  Phi->setIncomingValue(1, Phi->getIncomingValue(0));
  llvm::RecursivelyDeleteTriviallyDeadInstructions(Root);

  return true;
}


// A freeze whose operand is a vp.merge intrinsic call may be the root of a
// widenable i1 recurrence; hand it to widenVPMerge. Any other freeze is left
// untouched.
bool RISCVCodeGenPrepare::visitFreezeInst(FreezeInst &I) {
  const auto *Frozen = dyn_cast<IntrinsicInst>(I.getOperand(0));
  if (!Frozen || Frozen->getIntrinsicID() != Intrinsic::vp_merge)
    return false;
  return widenVPMerge(&I);
}


// Intrinsic calls are first offered to the dedicated rewrites
// (expandVPStrideLoad, expandMulReduction, widenVPMerge). If none of them
// applies, the reduction-phi rewrite described below is attempted.
//
// LLVM vector reduction intrinsics return a scalar result, but on RISC-V vector
// reduction instructions write the result in the first element of a vector
// register. So when a reduction in a loop uses a scalar phi, we end up with
// unnecessary scalar moves:
//
// loop:
// vfmv.s.f v10, fa0
// vfredosum.vs v8, v8, v10
// vfmv.f.s fa0, v8
//
// This mainly affects ordered fadd reductions and VP reductions that have a
// scalar start value, since other types of reduction typically use element-wise
// vectorisation in the loop body. This tries to vectorize any scalar phis that
// feed into these reductions:
//
// loop:
// %phi = phi float [ ..., %entry ], [ %acc, %loop ]
// %acc = call float @llvm.vector.reduce.fadd.nxv2f32(float %phi,
//                                                    <vscale x 2 x float> %vec)
//
// ->
//
// loop:
// %phi = phi <vscale x 2 x float> [ ..., %entry ], [ %acc.vec, %loop ]
// %phi.scalar = extractelement <vscale x 2 x float> %phi, i64 0
// %acc = call float @llvm.vector.reduce.fadd.nxv2f32(float %phi.scalar,
//                                                    <vscale x 2 x float> %vec)
// %acc.vec = insertelement <vscale x 2 x float> poison, float %acc, i64 0
//
// Which eliminates the scalar -> vector -> scalar crossing during instruction
// selection.
bool RISCVCodeGenPrepare::visitIntrinsicInst(IntrinsicInst &I) {
  // Stop at the first rewrite that fires: each of them may have erased I.
  if (expandVPStrideLoad(I) || expandMulReduction(I) || widenVPMerge(&I))
    return true;

  const bool IsCandidateReduction =
      I.getIntrinsicID() == Intrinsic::vector_reduce_fadd ||
      isa<VPReductionIntrinsic>(&I);
  if (!IsCandidateReduction)
    return false;

  // The start value must be a phi used only by this reduction, and the
  // reduction result must flow back into that phi.
  auto *ScalarPhi = dyn_cast<PHINode>(I.getOperand(0));
  if (!ScalarPhi)
    return false;
  if (!ScalarPhi->hasOneUse() ||
      !llvm::is_contained(ScalarPhi->incoming_values(), &I))
    return false;

  Type *VecTy = I.getOperand(1)->getType();
  IRBuilder<> Builder(ScalarPhi);
  PHINode *VecPhi =
      Builder.CreatePHI(VecTy, ScalarPhi->getNumIncomingValues());

  // Wrap each incoming scalar into lane 0 of a vector at the end of its
  // predecessor block.
  for (BasicBlock *Pred : ScalarPhi->blocks()) {
    Builder.SetInsertPoint(Pred->getTerminator());
    Value *Incoming = ScalarPhi->getIncomingValueForBlock(Pred);
    Value *Wrapped =
        Builder.CreateInsertElement(VecTy, Incoming, static_cast<uint64_t>(0));
    VecPhi->addIncoming(Wrapped, Pred);
  }

  // Feed the reduction from lane 0 of the vector phi instead.
  Builder.SetInsertPoint(&I);
  Value *Start =
      Builder.CreateExtractElement(VecPhi, static_cast<uint64_t>(0));
  I.setOperand(0, Start);

  ScalarPhi->eraseFromParent();

  return true;
}


// Split Vec into consecutive subvectors of PieceEC elements each, then
// multiply them together pairwise, level by level, until only one piece is
// left. The number of pieces is expected to be a power of two. Returns the
// final piece.
static Value *buildMulTree(IRBuilder<> &Builder, ElementCount PieceEC,
                           Value *Vec) {
  auto *FullTy = cast<VectorType>(Vec->getType());
  auto *PieceTy = VectorType::get(FullTy->getElementType(), PieceEC);
  const unsigned EltsPerPiece = PieceEC.getKnownMinValue();
  const unsigned NumPieces =
      FullTy->getElementCount().getKnownMinValue() / EltsPerPiece;
  assert(isPowerOf2_32(NumPieces));

  // Leaves of the tree: one extract per piece, in order.
  SmallVector<Value *, 8> Pieces(NumPieces);
  for (unsigned Idx = 0; Idx != NumPieces; ++Idx)
    Pieces[Idx] =
        Builder.CreateExtractVector(PieceTy, Vec, Idx * EltsPerPiece);

  // Each level combines neighbouring pairs in place and halves the number of
  // live entries at the front of Pieces.
  for (unsigned Live = NumPieces; Live > 1; Live /= 2)
    for (unsigned Pair = 0; Pair != Live / 2; ++Pair)
      Pieces[Pair] = Builder.CreateMul(Pieces[2 * Pair], Pieces[2 * Pair + 1],
                                       "bin.rdx");

  return Pieces[0];
}


// Partially expand a vector_reduce_mul wider than M1 to reduce
// register pressure and the number of vsetvlis required.
//
// Returns true if II was rewritten; II is erased in that case and must not be
// used by the caller afterwards.
bool RISCVCodeGenPrepare::expandMulReduction(IntrinsicInst &II) {
  if (II.getIntrinsicID() != Intrinsic::vector_reduce_mul)
    return false;

  if (!ST->hasVInstructions())
    return false;

  Value *TmpVec = II.getArgOperand(0);
  auto *VecTy = cast<VectorType>(TmpVec->getType());
  unsigned EltSize = VecTy->getScalarSizeInBits();

  // The splitting below sizes an m1 piece as <bits> / EltSize. With a
  // non-power-of-two element size that quotient does not evenly divide the
  // vector, so lanes would be dropped or undefined lanes pulled in. Leave
  // such reductions alone.
  if (!isPowerOf2_32(EltSize))
    return false;

  if (auto *ScalTy = dyn_cast<ScalableVectorType>(VecTy)) {
    unsigned MinElts = ScalTy->getMinNumElements();

    if (auto VLen = ST->getRealVLen()) {
      // If VLEN is exactly known, convert to a fixed vector reduction and
      // recurse to let the fixed path handle it (shuffle reduction instead
      // of a scalar loop).
      unsigned VScale = *VLen / RISCV::RVVBitsPerBlock;
      auto *FixedTy =
          FixedVectorType::get(VecTy->getElementType(), MinElts * VScale);
      IRBuilder<> Builder(&II);
      Value *Fixed = Builder.CreateExtractVector(FixedTy, TmpVec, (uint64_t)0);
      auto *FixedRdx = cast<IntrinsicInst>(Builder.CreateIntrinsic(
          Intrinsic::vector_reduce_mul, {FixedTy}, {Fixed}));
      II.replaceAllUsesWith(FixedRdx);
      II.eraseFromParent();
      expandMulReduction(*FixedRdx);
      return true;
    }

    // M1MinElts is zero when an element is wider than one RVV block; bail out
    // before it is used as a divisor.
    unsigned M1MinElts = RISCV::RVVBitsPerBlock / EltSize;
    if (M1MinElts == 0 || MinElts <= M1MinElts ||
        !isPowerOf2_32(MinElts / M1MinElts))
      return false;

    IRBuilder<> Builder(&II);
    auto M1EC = ElementCount::getScalable(M1MinElts);
    Value *Reduced = buildMulTree(Builder, M1EC, TmpVec);
    Value *Rdx = Builder.CreateIntrinsic(Intrinsic::vector_reduce_mul,
                                         {Reduced->getType()}, {Reduced});
    II.replaceAllUsesWith(Rdx);
    II.eraseFromParent();
    return true;
  }

  unsigned VF = cast<FixedVectorType>(VecTy)->getNumElements();
  unsigned MinVLen = ST->getRealMinVLen();
  unsigned M1VF = MinVLen / EltSize;

  // M1VF is zero when a single element does not fit in MinVLen bits; a
  // zero-element m1 type cannot be formed, so give up in that case too.
  if (M1VF == 0 || !isPowerOf2_32(VF) || VF <= M1VF)
    return false;

  IRBuilder<> Builder(&II);
  auto M1EC = ElementCount::getFixed(M1VF);
  auto *M1Ty = VectorType::get(VecTy->getElementType(), M1EC);

  // When VLEN is exactly known, extract m1 pieces and build a mul tree.
  // This greatly reduces register pressure during the reduction, and
  // avoids all but one vsetvli (the one from original LMUL to m1).
  // TODO: Generalize to handle the splitting case.
  if (MinVLen == ST->getRealMaxVLen() && VF <= 8 * M1VF) {
    TmpVec = buildMulTree(Builder, M1EC, TmpVec);
  } else {
    // For non-exact VLEN, shuffle-reduce at the original vector width down to
    // m1, then extract.  This prioritizes reducing the number of vsetvli
    // over maximal reduction of LMUL for the intermediate states.
    SmallVector<int, 32> ShuffleMask(VF);
    for (unsigned LiveElts = VF; LiveElts > M1VF; LiveElts /= 2) {
      unsigned Half = LiveElts / 2;
      // Lanes [0, Half) read lanes [Half, 2 * Half); the rest are undefined.
      std::iota(ShuffleMask.begin(), ShuffleMask.begin() + Half, Half);
      std::fill(ShuffleMask.begin() + Half, ShuffleMask.end(), -1);
      Value *Shuf =
          Builder.CreateShuffleVector(TmpVec, ShuffleMask, "rdx.shuf");
      TmpVec = Builder.CreateMul(TmpVec, Shuf, "bin.rdx");
    }
    // Extract the M1-sized subvector and emit the final reduction intrinsic.
    // This is the reason we're here - to force a vsetvli toggle once at m1.
    TmpVec = Builder.CreateExtractVector(M1Ty, TmpVec, (uint64_t)0, "rdx.sub");
  }

  Value *Rdx =
      Builder.CreateIntrinsic(Intrinsic::vector_reduce_mul, {M1Ty}, {TmpVec});
  II.replaceAllUsesWith(Rdx);
  II.eraseFromParent();
  return true;
}


// Always expand zero strided loads so we match more .vx splat patterns, even if
// we have +optimized-zero-stride-loads. RISCVDAGToDAGISel::Select will convert
// it back to a strided load if it's optimized.
//
// Matches experimental.vp.strided.load with a zero stride and an all-ones
// mask, and replaces it with a scalar load that is splatted and merged under
// the original mask and VL. Returns true if II was replaced (and erased).
bool RISCVCodeGenPrepare::expandVPStrideLoad(IntrinsicInst &II) {
  Value *BasePtr, *VL;

  using namespace PatternMatch;
  if (!match(&II, m_Intrinsic<Intrinsic::experimental_vp_strided_load>(
                      m_Value(BasePtr), m_Zero(), m_AllOnes(), m_Value(VL))))
    return false;

  // If SEW>XLEN then a splat will get lowered as a zero strided load anyway, so
  // avoid expanding here.
  if (II.getType()->getScalarSizeInBits() > ST->getXLen())
    return false;

  // The scalar load emitted below is unconditional, so only expand when VL is
  // known to be non-zero.
  if (!isKnownNonZero(VL, {*DL, DT, nullptr, &II}))
    return false;

  auto *VTy = cast<VectorType>(II.getType());

  IRBuilder<> Builder(&II);
  Type *STy = VTy->getElementType();
  // Carry over an explicit `align` attribute from the intrinsic's pointer
  // operand. A plain CreateLoad would assume the ABI alignment of STy, which
  // overstates the alignment when the call was annotated with a smaller one.
  // With no attribute present, CreateAlignedLoad falls back to the ABI
  // alignment, exactly as before.
  Value *Val = Builder.CreateAlignedLoad(STy, BasePtr, II.getParamAlign(0));
  Value *Res = Builder.CreateIntrinsic(
      Intrinsic::vp_merge, VTy,
      {II.getOperand(2), Builder.CreateVectorSplat(VTy->getElementCount(), Val),
       PoisonValue::get(VTy), VL});

  II.replaceAllUsesWith(Res);
  II.eraseFromParent();
  return true;
}


bool RISCVCodeGenPrepare::run() {

  bool MadeChange = false;

  for (auto &BB : F)

    for (Instruction &I : llvm::make_early_inc_range(BB))

      MadeChange |= visit(I);


  return MadeChange;

}


// Legacy pass manager entry point: gather the subtarget and dominator tree for
// F and run the shared implementation. Returns true if the IR changed.
bool RISCVCodeGenPrepareLegacyPass::runOnFunction(Function &F) {
  if (skipFunction(F))
    return false;

  auto &TM = getAnalysis<TargetPassConfig>().getTM<RISCVTargetMachine>();
  const RISCVSubtarget *Subtarget = &TM.getSubtarget<RISCVSubtarget>(F);
  const DominatorTree *DomTree =
      &getAnalysis<DominatorTreeWrapperPass>().getDomTree();

  return RISCVCodeGenPrepare(F, DomTree, Subtarget).run();
}


// Register the legacy pass. Every analysis requested in getAnalysisUsage is
// listed as an initialization dependency so it is registered before this pass.
INITIALIZE_PASS_BEGIN(RISCVCodeGenPrepareLegacyPass, DEBUG_TYPE, PASS_NAME,
                      false, false)
INITIALIZE_PASS_DEPENDENCY(DominatorTreeWrapperPass)
INITIALIZE_PASS_DEPENDENCY(TargetPassConfig)
INITIALIZE_PASS_END(RISCVCodeGenPrepareLegacyPass, DEBUG_TYPE, PASS_NAME, false,
                    false)


// Definition of the pass ID that the constructor hands to FunctionPass.
char RISCVCodeGenPrepareLegacyPass::ID = 0;


// Factory for the legacy pass: returns a newly heap-allocated
// RISCVCodeGenPrepareLegacyPass.
FunctionPass *llvm::createRISCVCodeGenPrepareLegacyPass() {

  return new RISCVCodeGenPrepareLegacyPass();

}


// New pass manager entry point. Runs the shared implementation on F and
// reports which analyses survive: everything when nothing changed, otherwise
// only the CFG-based analyses.
PreservedAnalyses RISCVCodeGenPreparePass::run(Function &F,
                                               FunctionAnalysisManager &FAM) {
  DominatorTree &DomTree = FAM.getResult<DominatorTreeAnalysis>(F);
  const RISCVSubtarget *Subtarget = &TM->getSubtarget<RISCVSubtarget>(F);

  if (!RISCVCodeGenPrepare(F, &DomTree, Subtarget).run())
    return PreservedAnalyses::all();

  PreservedAnalyses Preserved = PreservedAnalyses::none();
  Preserved.preserveSet<CFGAnalyses>();
  return Preserved;
}


assert
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")

PHI
Rewrite undef for PHI
Definition AMDGPURewriteUndefForPHI.cpp:98

DL
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
Definition ARMSLSHardening.cpp:73

Dominators.h

runOnFunction
static bool runOnFunction(Function &F, bool PostInlining)
Definition EntryExitInstrumenter.cpp:109

DEBUG_TYPE
#define DEBUG_TYPE
Definition GenericCycleImpl.h:31

IRBuilder.h

IntrinsicInst.h

InitializePasses.h

InstVisitor.h

Intrinsics.h

TemplateParamKind::Type
@ Type
Definition ItaniumDemangle.h:1243

F
#define F(x, y, z)
Definition MD5.cpp:54

I
#define I(x, y, z)
Definition MD5.cpp:57

II
uint64_t IntrinsicInst * II
Definition NVVMIntrRange.cpp:46

FAM
FunctionAnalysisManager FAM
Definition PassBuilderBindings.cpp:61

INITIALIZE_PASS_DEPENDENCY
#define INITIALIZE_PASS_DEPENDENCY(depName)
Definition PassSupport.h:42

INITIALIZE_PASS_END
#define INITIALIZE_PASS_END(passName, arg, name, cfg, analysis)
Definition PassSupport.h:44

INITIALIZE_PASS_BEGIN
#define INITIALIZE_PASS_BEGIN(passName, arg, name, cfg, analysis)
Definition PassSupport.h:39

Pass.h

PatternMatch.h

buildMulTree
static Value * buildMulTree(IRBuilder<> &Builder, ElementCount PieceEC, Value *Vec)
Definition RISCVCodeGenPrepare.cpp:269

PASS_NAME
#define PASS_NAME
Definition RISCVCodeGenPrepare.cpp:34

RISCVTargetMachine.h

RISCV.h

visit
static void visit(BasicBlock &Start, std::function< bool(BasicBlock *)> op)
Definition SPIRVStructurizer.cpp:189

Statistic.h
This file defines the 'Statistic' class, which is designed to be an easy way to expose various metric...

TargetPassConfig.h
Target-Independent Code Generator Pass Configuration Options pass.

Local.h

PASS_NAME
#define PASS_NAME
Definition TypePromotion.cpp:43

ValueTracking.h

RHS
Value * RHS
Definition X86PartialReduction.cpp:81

llvm::AnalysisUsage::addRequired
AnalysisUsage & addRequired()
Definition PassAnalysisSupport.h:76

llvm::AnalysisUsage::setPreservesCFG
LLVM_ABI void setPreservesCFG()
This function should be called by the pass, iff they do not:
Definition Pass.cpp:275

llvm::BinaryOperator
Definition InstrTypes.h:206

llvm::CFGAnalyses
Represents analyses that only rely on functions' control flow.
Definition Analysis.h:73

llvm::ConstantAggregateZero::get
static LLVM_ABI ConstantAggregateZero * get(Type *Ty)
Definition Constants.cpp:1810

llvm::DataLayout
A parsed version of the target data layout string in and methods for querying it.
Definition DataLayout.h:64

llvm::DominatorTreeAnalysis
Analysis pass which computes a DominatorTree.
Definition Dominators.h:270

llvm::DominatorTree
Concrete subclass of DominatorTreeBase that is used to compute a normal dominator tree.
Definition Dominators.h:151

llvm::ElementCount
Definition TypeSize.h:298

llvm::ElementCount::getScalable
static constexpr ElementCount getScalable(ScalarTy MinVal)
Definition TypeSize.h:312

llvm::ElementCount::getFixed
static constexpr ElementCount getFixed(ScalarTy MinVal)
Definition TypeSize.h:309

llvm::FixedVectorType::get
static LLVM_ABI FixedVectorType * get(Type *ElementType, unsigned NumElts)
Definition Type.cpp:867

llvm::FreezeInst
This class represents a freeze function that returns random concrete value if an operand is either a ...
Definition Instructions.h:5398

llvm::FunctionPass
FunctionPass class - This class is used to implement most global optimizations.
Definition Pass.h:314

llvm::Function
Definition Function.h:65

llvm::IRBuilder
This provides a uniform API for creating instructions and inserting them into a basic block: either a...
Definition IRBuilder.h:2848

llvm::InstVisitor
Base class for instruction visitors.
Definition InstVisitor.h:78

llvm::Instruction
Definition Instruction.h:70

llvm::IntrinsicInst
A wrapper class for inspecting calls to intrinsic functions.
Definition IntrinsicInst.h:49

llvm::PHINode::addIncoming
void addIncoming(Value *V, BasicBlock *BB)
Add an incoming value to the end of the PHI list.
Definition Instructions.h:2795

llvm::PoisonValue::get
static LLVM_ABI PoisonValue * get(Type *T)
Static factory methods - Return an 'poison' object of the specified type.
Definition Constants.cpp:2034

llvm::PreservedAnalyses
A set of analyses that are preserved following a run of a transformation pass.
Definition Analysis.h:112

llvm::PreservedAnalyses::none
static PreservedAnalyses none()
Convenience factory function for the empty preserved set.
Definition Analysis.h:115

llvm::PreservedAnalyses::all
static PreservedAnalyses all()
Construct a special preserved set that preserves all passes.
Definition Analysis.h:118

llvm::PreservedAnalyses::preserveSet
PreservedAnalyses & preserveSet()
Mark an analysis set as preserved.
Definition Analysis.h:151

llvm::RISCVCodeGenPreparePass::run
PreservedAnalyses run(Function &F, FunctionAnalysisManager &FAM)
Definition RISCVCodeGenPrepare.cpp:447

llvm::RISCVSubtarget
Definition RISCVSubtarget.h:84

llvm::RISCVSubtarget::getRealMinVLen
unsigned getRealMinVLen() const
Definition RISCVSubtarget.h:263

llvm::RISCVSubtarget::getXLen
unsigned getXLen() const
Definition RISCVSubtarget.h:234

llvm::RISCVSubtarget::hasVInstructions
bool hasVInstructions() const
Definition RISCVSubtarget.h:315

llvm::RISCVSubtarget::getRealVLen
std::optional< unsigned > getRealVLen() const
Definition RISCVSubtarget.h:272

llvm::RISCVSubtarget::getRealMaxVLen
unsigned getRealMaxVLen() const
Definition RISCVSubtarget.h:267

llvm::RISCVSubtarget::is64Bit
bool is64Bit() const
Definition RISCVSubtarget.h:229

llvm::SmallVectorImpl::truncate
void truncate(size_type N)
Like resize, but requires that N is less than size().
Definition SmallVector.h:663

llvm::SmallVectorTemplateCommon::size
size_t size() const
Definition SmallVector.h:83

llvm::SmallVector
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition SmallVector.h:1236

llvm::TargetPassConfig
Target-Independent Code Generator Pass Configuration Options.
Definition TargetPassConfig.h:84

llvm::Type::getScalarType
Type * getScalarType() const
If this is a vector type, return the element type, otherwise return 'this'.
Definition Type.h:368

llvm::Type::getScalarSizeInBits
LLVM_ABI unsigned getScalarSizeInBits() const LLVM_READONLY
If this is a vector type, return the getPrimitiveSizeInBits value for the element type.
Definition Type.cpp:232

llvm::Type::isIntegerTy
bool isIntegerTy() const
True if this is an instance of IntegerType.
Definition Type.h:257

llvm::User::setOperand
void setOperand(unsigned i, Value *Val)
Definition User.h:212

llvm::User::getOperand
Value * getOperand(unsigned i) const
Definition User.h:207

llvm::Value
LLVM Value Representation.
Definition Value.h:75

llvm::Value::getType
Type * getType() const
All values are typed, get the type of this value.
Definition Value.h:255

llvm::Value::replaceAllUsesWith
LLVM_ABI void replaceAllUsesWith(Value *V)
Change all uses of this to point to a new Value.
Definition Value.cpp:553

llvm::Value::getContext
LLVMContext & getContext() const
All values hold a context through their type.
Definition Value.h:258

llvm::VectorType::get
static LLVM_ABI VectorType * get(Type *ElementType, ElementCount EC)
This static method is the primary way to construct an VectorType.

llvm::details::FixedOrScalableQuantity::getKnownMinValue
constexpr ScalarTy getKnownMinValue() const
Returns the minimum value this quantity can represent.
Definition TypeSize.h:165

Changed
Changed
Definition ObjCARCOpts.cpp:2366

false
Definition MachinePipeliner.cpp:245

llvm::ARM_MB::ST
@ ST
Definition ARMBaseInfo.h:73

llvm::BitmaskEnumDetail::Mask
constexpr std::underlying_type_t< E > Mask()
Get a bitmask with 1s in all places up to the high-order bit of E's largest value.
Definition BitmaskEnum.h:126

llvm::CallingConv::ID
unsigned ID
LLVM IR allows to use arbitrary numbers as calling convention identifiers.
Definition CallingConv.h:24

llvm::CallingConv::C
@ C
The default llvm calling convention, compatible with C.
Definition CallingConv.h:34

llvm::PatternMatchHelpers::m_CombineOr
match_combine_or< Ty... > m_CombineOr(const Ty &...Ps)
Combine pattern matchers matching any of Ps patterns.
Definition PatternMatchHelpers.h:56

llvm::PatternMatch::m_AllOnes
cst_pred_ty< is_all_ones > m_AllOnes()
Match an integer or vector with all bits set.
Definition PatternMatch.h:508

llvm::PatternMatch::m_Freeze
OneOps_match< OpTy, Instruction::Freeze > m_Freeze(const OpTy &Op)
Matches FreezeInst.
Definition PatternMatch.h:1938

llvm::PatternMatch::match
bool match(Val *V, const Pattern &P)
Definition PatternMatch.h:53

llvm::PatternMatch::m_Intrinsic
IntrinsicID_match m_Intrinsic()
Match intrinsic calls like this: m_Intrinsic<Intrinsic::fabs>(m_Value(X))
Definition PatternMatch.h:2797

llvm::PatternMatch::m_Value
auto m_Value()
Match an arbitrary value and ignore it.
Definition PatternMatch.h:135

llvm::PatternMatch::m_NNegZExt
NNegZExt_match< OpTy > m_NNegZExt(const OpTy &Op)
Definition PatternMatch.h:2251

llvm::PatternMatch::m_Zero
is_zero m_Zero()
Match any null constant or a vector with all elements equal to 0.
Definition PatternMatch.h:607

llvm::RISCV::RVVBitsPerBlock
static constexpr unsigned RVVBitsPerBlock
Definition RISCVTargetParser.h:69

llvm::codeview::EncodedFramePtrReg::BasePtr
@ BasePtr
Definition CodeView.h:527

llvm::rdf::Phi
NodeAddr< PhiNode * > Phi
Definition RDFGraph.h:390

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition FunctionInfo.h:25

llvm::RecursivelyDeleteTriviallyDeadInstructions
LLVM_ABI bool RecursivelyDeleteTriviallyDeadInstructions(Value *V, const TargetLibraryInfo *TLI=nullptr, MemorySSAUpdater *MSSAU=nullptr, std::function< void(Value *)> AboutToDeleteCallback=std::function< void(Value *)>())
If the specified value is a trivially dead instruction, delete it.
Definition Local.cpp:535

llvm::isInt
constexpr bool isInt(int64_t x)
Checks if an integer fits into the given bit width.
Definition MathExtras.h:165

llvm::createRISCVCodeGenPrepareLegacyPass
FunctionPass * createRISCVCodeGenPrepareLegacyPass()
Definition RISCVCodeGenPrepare.cpp:443

llvm::dyn_cast
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:643

llvm::make_early_inc_range
iterator_range< early_inc_iterator_impl< detail::IterOfRange< RangeT > > > make_early_inc_range(RangeT &&Range)
Make a range that does early increment to allow mutation of the underlying range without disrupting i...
Definition STLExtras.h:633

llvm::FloatStyle::Fixed
@ Fixed
Definition NativeFormatting.h:18

llvm::Value
RelativeUniformCounterPtr ValuesPtrExpr VTableAddr Value
Definition InstrProf.h:143

llvm::isPowerOf2_32
constexpr bool isPowerOf2_32(uint32_t Value)
Return true if the argument is a power of two > 0.
Definition MathExtras.h:279

llvm::isUInt
constexpr bool isUInt(uint64_t x)
Checks if an unsigned integer fits into the given bit width.
Definition MathExtras.h:189

llvm::SmallVector
class LLVM_GSL_OWNER SmallVector
Forward declaration of SmallVector so that calculateSmallVectorDefaultInlinedElements can reference s...
Definition SmallVector.h:1162

llvm::isa
bool isa(const From &Val)
isa<X> - Return true if the parameter to the template is an instance of one of the template type argu...
Definition Casting.h:547

llvm::isKnownNonZero
LLVM_ABI bool isKnownNonZero(const Value *V, const SimplifyQuery &Q, unsigned Depth=0)
Return true if the given value is known to be non-zero when defined.
Definition ValueTracking.cpp:3800

llvm::IRBuilder
IRBuilder(LLVMContext &, FolderTy, InserterTy, MDNode *, ArrayRef< OperandBundleDef >) -> IRBuilder< FolderTy, InserterTy >

llvm::cast
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:559

llvm::is_contained
bool is_contained(R &&Range, const E &Element)
Returns true if Element is found in Range.
Definition STLExtras.h:1947

llvm::SignExtend64
constexpr int64_t SignExtend64(uint64_t x)
Sign-extend the number in the bottom B bits of X to a 64-bit integer.
Definition MathExtras.h:572

llvm::FunctionAnalysisManager
AnalysisManager< Function > FunctionAnalysisManager
Convenience typedef for the Function analysis manager.
Definition PassManager.h:586