doxygen/ARMTargetTransformInfo_8h_source.html

//===- ARMTargetTransformInfo.h - ARM specific TTI --------------*- C++ -*-===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

//

/// \file

/// This file defines a TargetTransformInfoImplBase conforming object specific
/// to the ARM target machine. It uses the target's detailed information to

/// provide more precise answers to certain TTI queries, while letting the

/// target independent and default TTI implementations handle the rest.

//

//===----------------------------------------------------------------------===//


#ifndef LLVM_LIB_TARGET_ARM_ARMTARGETTRANSFORMINFO_H

#define LLVM_LIB_TARGET_ARM_ARMTARGETTRANSFORMINFO_H


#include "ARM.h"

#include "ARMSubtarget.h"

#include "ARMTargetMachine.h"

#include "llvm/ADT/ArrayRef.h"

#include "llvm/Analysis/TargetTransformInfo.h"

#include "llvm/CodeGen/BasicTTIImpl.h"

#include "llvm/IR/Constant.h"

#include "llvm/IR/Function.h"

#include "llvm/TargetParser/SubtargetFeature.h"

#include <optional>


namespace llvm {


class APInt;

class ARMTargetLowering;

class Instruction;

class Loop;

class SCEV;

class ScalarEvolution;

class Type;

class Value;


namespace TailPredication {

/// Tail-predication modes. The enumerators are numbered consecutively
/// starting from zero.
enum Mode {
  Disabled = 0,
  EnabledNoReductions = 1,
  Enabled = 2,
  ForceEnabledNoReductions = 3,
  ForceEnabled = 4
};

} // end namespace TailPredication


// Settings that control the conversion of memcpy into a Tail Predicated loop.
namespace TPLoop {

enum MemTransfer {
  ForceDisabled = 0,
  ForceEnabled = 1,
  Allow = 2
};

} // end namespace TPLoop


class ARMTTIImpl final : public BasicTTIImplBase<ARMTTIImpl> {

  using BaseT = BasicTTIImplBase<ARMTTIImpl>;

  using TTI = TargetTransformInfo;


  friend BaseT;


  const ARMSubtarget *ST;

  const ARMTargetLowering *TLI;


  /// Accessor for the stored ARM subtarget pointer (the ST member).
  const ARMSubtarget *getST() const { return ST; }

  /// Accessor for the stored ARM target-lowering pointer (the TLI member).
  const ARMTargetLowering *getTLI() const { return TLI; }


public:


  /// Builds the ARM TTI implementation for function \p F. The target machine
  /// \p TM and F's data layout are forwarded to the base class; the subtarget
  /// that \p TM reports for \p F and that subtarget's target lowering are
  /// stored in ST and TLI.
  ///
  /// TLI is initialised from ST, so this relies on ST being declared (and
  /// therefore initialised) before TLI.
  explicit ARMTTIImpl(const ARMBaseTargetMachine *TM, const Function &F)

      : BaseT(TM, F.getDataLayout()), ST(TM->getSubtargetImpl(F)),

        TLI(ST->getTargetLowering()) {}


  /// Interleaved-access vectorization is unconditionally reported as enabled.
  bool enableInterleavedAccessVectorization() const override { return true; }


  TTI::AddressingModeKind

  getPreferredAddressingMode(const Loop *L, ScalarEvolution *SE) const override;


  /// ARMv8 AArch32 Advanced SIMD floating-point computation is unchanged from
  /// ARMv7; only AArch64 SIMD and Arm MVE are IEEE-754 compliant.
  ///
  /// \returns true unless the target is Darwin or the subtarget has MVE
  /// floating-point operations.
  bool isFPVectorizationPotentiallyUnsafe() const override {
    const bool Exempt = ST->isTargetDarwin() || ST->hasMVEFloatOps();
    return !Exempt;
  }


  std::optional<Instruction *>

  instCombineIntrinsic(InstCombiner &IC, IntrinsicInst &II) const override;

  std::optional<Value *> simplifyDemandedVectorEltsIntrinsic(

      InstCombiner &IC, IntrinsicInst &II, APInt DemandedElts, APInt &UndefElts,

      APInt &UndefElts2, APInt &UndefElts3,

      std::function<void(Instruction *, unsigned, APInt, APInt &)>

          SimplifyAndSetOp) const override;


  /// \name Scalar TTI Implementations

  /// @{


  InstructionCost getIntImmCodeSizeCost(unsigned Opcode, unsigned Idx,

                                        const APInt &Imm,

                                        Type *Ty) const override;


  using BaseT::getIntImmCost;

  InstructionCost getIntImmCost(const APInt &Imm, Type *Ty,

                                TTI::TargetCostKind CostKind) const override;


  InstructionCost getIntImmCostInst(unsigned Opcode, unsigned Idx,

                                    const APInt &Imm, Type *Ty,

                                    TTI::TargetCostKind CostKind,

                                    Instruction *Inst = nullptr) const override;


  /// @}


  /// \name Vector TTI Implementations

  /// @{


  /// Reports the number of registers in register class \p ClassID.
  ///
  /// Class 1 is treated as the vector class: 16 registers with NEON, else 8
  /// with MVE integer operations, else 0. Every other class is answered as
  /// the scalar class: 8 registers on Thumb1-only subtargets, 13 otherwise.
  unsigned getNumberOfRegisters(unsigned ClassID) const override {
    const bool IsVectorClass = ClassID == 1;

    // Scalar query: handle it first so the vector logic reads straight down.
    if (!IsVectorClass)
      return ST->isThumb1Only() ? 8 : 13;

    // NEON takes precedence over MVE when both are reported.
    if (ST->hasNEON())
      return 16;
    return ST->hasMVEIntegerOps() ? 8 : 0;
  }


  /// Reports the register width, in bits, for register kind \p K.
  ///
  /// Scalar registers are 32 bits wide. Fixed-width vector registers are 128
  /// bits wide when the subtarget has NEON or MVE integer operations, and 0
  /// otherwise. Scalable vectors are reported with a minimum size of 0.
  TypeSize
  getRegisterBitWidth(TargetTransformInfo::RegisterKind K) const override {
    switch (K) {
    case TargetTransformInfo::RGK_Scalar:
      return TypeSize::getFixed(32);
    case TargetTransformInfo::RGK_FixedWidthVector: {
      // NEON and MVE both yield the same vector width.
      const bool HasVectorUnit = ST->hasNEON() || ST->hasMVEIntegerOps();
      return TypeSize::getFixed(HasVectorUnit ? 128 : 0);
    }
    case TargetTransformInfo::RGK_ScalableVector:
      return TypeSize::getScalable(0);
    }
    llvm_unreachable("Unsupported register kind");
  }


  /// Returns the subtarget's maximum interleave factor. Neither \p VF nor
  /// \p HasUnorderedReductions influences the result.
  unsigned getMaxInterleaveFactor(ElementCount VF,

                                  bool HasUnorderedReductions) const override {

    return ST->getMaxInterleaveFactor();

  }


  bool isProfitableLSRChainElement(Instruction *I) const override;


  bool

  isLegalMaskedLoad(Type *DataTy, Align Alignment, unsigned AddressSpace,

                    TTI::MaskKind MaskKind =

                        TTI::MaskKind::VariableOrConstantMask) const override;


  /// A masked store is legal exactly when the masked load with the same
  /// arguments is: every argument is forwarded to isLegalMaskedLoad.
  bool


  isLegalMaskedStore(Type *DataTy, Align Alignment, unsigned AddressSpace,

                     TTI::MaskKind MaskKind =

                         TTI::MaskKind::VariableOrConstantMask) const override {

    return isLegalMaskedLoad(DataTy, Alignment, AddressSpace, MaskKind);

  }


  /// Always requests scalarization of masked gathers; \p VTy and
  /// \p Alignment are not consulted.
  bool forceScalarizeMaskedGather(VectorType *VTy,

                                  Align Alignment) const override {

    // For MVE, we have a custom lowering pass that will already have custom

    // legalised any gathers that we can lower to MVE intrinsics, and want to

    // expand all the rest. The pass runs before the masked intrinsic lowering

    // pass.

    return true;

  }


  /// Masked scatters follow the same scalarization decision as masked
  /// gathers: the query is forwarded to forceScalarizeMaskedGather.
  bool forceScalarizeMaskedScatter(VectorType *VTy,

                                   Align Alignment) const override {

    return forceScalarizeMaskedGather(VTy, Alignment);

  }


  bool isLegalMaskedGather(Type *Ty, Align Alignment) const override;


  /// A masked scatter is legal exactly when a masked gather of the same type
  /// and alignment is: the query is forwarded to isLegalMaskedGather.
  bool isLegalMaskedScatter(Type *Ty, Align Alignment) const override {

    return isLegalMaskedGather(Ty, Alignment);

  }


  InstructionCost getMemcpyCost(const Instruction *I) const override;


  /// Returns the subtarget's maximum inline size threshold.
  uint64_t getMaxMemIntrinsicInlineSizeThreshold() const override {

    return ST->getMaxInlineSizeThreshold();

  }


  int getNumMemOps(const IntrinsicInst *I) const;


  InstructionCost

  getShuffleCost(TTI::ShuffleKind Kind, VectorType *DstTy, VectorType *SrcTy,

                 ArrayRef<int> Mask, TTI::TargetCostKind CostKind, int Index,

                 VectorType *SubTp, ArrayRef<const Value *> Args = {},

                 const Instruction *CxtI = nullptr) const override;


  bool preferInLoopReduction(RecurKind Kind, Type *Ty) const override;


  bool preferPredicatedReductionSelect() const override;


  /// Never requests expansion of a reduction intrinsic; \p II is not
  /// inspected.
  bool shouldExpandReduction(const IntrinsicInst *II) const override {

    return false;

  }


  InstructionCost getCFInstrCost(unsigned Opcode, TTI::TargetCostKind CostKind,

                                 const Instruction *I = nullptr) const override;


  InstructionCost

  getCastInstrCost(unsigned Opcode, Type *Dst, Type *Src,

                   TTI::CastContextHint CCH, TTI::TargetCostKind CostKind,

                   const Instruction *I = nullptr) const override;


  InstructionCost getCmpSelInstrCost(

      unsigned Opcode, Type *ValTy, Type *CondTy, CmpInst::Predicate VecPred,

      TTI::TargetCostKind CostKind,

      TTI::OperandValueInfo Op1Info = {TTI::OK_AnyValue, TTI::OP_None},

      TTI::OperandValueInfo Op2Info = {TTI::OK_AnyValue, TTI::OP_None},

      const Instruction *I = nullptr) const override;


  using BaseT::getVectorInstrCost;

  InstructionCost

  getVectorInstrCost(unsigned Opcode, Type *Val, TTI::TargetCostKind CostKind,

                     unsigned Index, const Value *Op0, const Value *Op1,

                     TTI::VectorInstrContext VIC =

                         TTI::VectorInstrContext::None) const override;


  InstructionCost

  getAddressComputationCost(Type *Val, ScalarEvolution *SE, const SCEV *Ptr,

                            TTI::TargetCostKind CostKind) const override;


  InstructionCost getArithmeticInstrCost(

      unsigned Opcode, Type *Ty, TTI::TargetCostKind CostKind,

      TTI::OperandValueInfo Op1Info = {TTI::OK_AnyValue, TTI::OP_None},

      TTI::OperandValueInfo Op2Info = {TTI::OK_AnyValue, TTI::OP_None},

      ArrayRef<const Value *> Args = {},

      const Instruction *CxtI = nullptr) const override;


  InstructionCost getMemoryOpCost(

      unsigned Opcode, Type *Src, Align Alignment, unsigned AddressSpace,

      TTI::TargetCostKind CostKind,

      TTI::OperandValueInfo OpInfo = {TTI::OK_AnyValue, TTI::OP_None},

      const Instruction *I = nullptr) const override;


  InstructionCost

  getMemIntrinsicInstrCost(const MemIntrinsicCostAttributes &MICA,

                           TTI::TargetCostKind CostKind) const override;


  InstructionCost getMaskedMemoryOpCost(const MemIntrinsicCostAttributes &MICA,

                                        TTI::TargetCostKind CostKind) const;


  InstructionCost getInterleavedMemoryOpCost(

      unsigned Opcode, Type *VecTy, unsigned Factor, ArrayRef<unsigned> Indices,

      Align Alignment, unsigned AddressSpace, TTI::TargetCostKind CostKind,

      bool UseMaskForCond = false, bool UseMaskForGaps = false) const override;


  InstructionCost getGatherScatterOpCost(const MemIntrinsicCostAttributes &MICA,

                                         TTI::TargetCostKind CostKind) const;


  InstructionCost

  getArithmeticReductionCost(unsigned Opcode, VectorType *ValTy,

                             std::optional<FastMathFlags> FMF,

                             TTI::TargetCostKind CostKind) const override;

  InstructionCost

  getExtendedReductionCost(unsigned Opcode, bool IsUnsigned, Type *ResTy,

                           VectorType *ValTy, std::optional<FastMathFlags> FMF,

                           TTI::TargetCostKind CostKind) const override;

  InstructionCost

  getMulAccReductionCost(bool IsUnsigned, unsigned RedOpcode, Type *ResTy,

                         VectorType *ValTy,

                         TTI::TargetCostKind CostKind) const override;


  InstructionCost

  getMinMaxReductionCost(Intrinsic::ID IID, VectorType *Ty, FastMathFlags FMF,

                         TTI::TargetCostKind CostKind) const override;


  InstructionCost

  getIntrinsicInstrCost(const IntrinsicCostAttributes &ICA,

                        TTI::TargetCostKind CostKind) const override;


  /// Always returns an invalid cost for partial reductions; none of the
  /// arguments is inspected.
  InstructionCost getPartialReductionCost(

      unsigned Opcode, Type *InputTypeA, Type *InputTypeB, Type *AccumType,

      ElementCount VF, TTI::PartialReductionExtendKind OpAExtend,

      TTI::PartialReductionExtendKind OpBExtend, std::optional<unsigned> BinOp,

      TTI::TargetCostKind CostKind,

      std::optional<FastMathFlags> FMF) const override {

    return InstructionCost::getInvalid();

  }


  /// getScalingFactorCost - Return the cost of the scaling used in

  /// addressing mode represented by AM.

  /// If the AM is supported, the return value must be >= 0.

  /// If the AM is not supported, the return value is an invalid cost.

  InstructionCost getScalingFactorCost(Type *Ty, GlobalValue *BaseGV,

                                       StackOffset BaseOffset, bool HasBaseReg,

                                       int64_t Scale,

                                       unsigned AddrSpace) const override;


  bool maybeLoweredToCall(Instruction &I) const;

  bool isLoweredToCall(const Function *F) const override;

  bool isHardwareLoopProfitable(Loop *L, ScalarEvolution &SE,

                                AssumptionCache &AC, TargetLibraryInfo *LibInfo,

                                HardwareLoopInfo &HWLoopInfo) const override;

  bool preferTailFoldingOverEpilogue(TailFoldingInfo *TFI) const override;

  void getUnrollingPreferences(Loop *L, ScalarEvolution &SE,

                               TTI::UnrollingPreferences &UP,

                               OptimizationRemarkEmitter *ORE) const override;


  TailFoldingStyle getPreferredTailFoldingStyle() const override;


  void getPeelingPreferences(Loop *L, ScalarEvolution &SE,

                             TTI::PeelingPreferences &PP) const override;


  /// Decides whether constant \p C may be placed in a switch lookup table.
  ///
  /// Under the ROPI and RWPI relocation models, constant data cannot hold
  /// pointers to global variables or functions, so a constant that needs
  /// dynamic relocation is rejected there. Otherwise the answer is always
  /// yes.
  bool shouldBuildLookupTablesForConstant(Constant *C) const override {
    const bool RestrictedRelocModel = ST->isROPI() || ST->isRWPI();
    // The relocation query is only made under ROPI/RWPI.
    return !RestrictedRelocModel || !C->needsDynamicRelocation();
  }


  bool shouldConsiderVectorizationRegPressure() const override;


  bool hasArmWideBranch(bool Thumb) const override;


  bool isProfitableToSinkOperands(Instruction *I,

                                  SmallVectorImpl<Use *> &Ops) const override;


  unsigned getNumBytesToPadGlobalArray(unsigned Size,

                                       Type *ArrayType) const override;


  /// @}

};


/// isVREVMask - Returns true when shuffle mask \p M corresponds to a VREV
/// instruction with block size \p BlockSize, i.e. the elements inside each
/// block of the vector appear in reversed order. Negative (UNDEF) mask
/// entries are accepted at any position.
///
/// \p VT supplies the scalar element size; only 8, 16 and 32 are accepted.
inline bool isVREVMask(ArrayRef<int> M, EVT VT, unsigned BlockSize) {
  assert((BlockSize == 16 || BlockSize == 32 || BlockSize == 64) &&
         "Only possible block sizes for VREV are: 16, 32, 64");

  const unsigned EltSz = VT.getScalarSizeInBits();
  const bool SupportedElt = EltSz == 8 || EltSz == 16 || EltSz == 32;
  if (!SupportedElt)
    return false;

  // The first index of a reversed block is its last element, which gives the
  // block length. If that index is UNDEF, be optimistic and assume the
  // length implied by BlockSize.
  const unsigned BlockElts = M[0] < 0 ? BlockSize / EltSz : M[0] + 1;

  if (BlockSize <= EltSz || BlockSize != BlockElts * EltSz)
    return false;

  for (unsigned Idx = 0, NumElts = M.size(); Idx != NumElts; ++Idx) {
    const int MaskElt = M[Idx];
    if (MaskElt < 0)
      continue; // UNDEF indices match anything

    // Position Idx must select the mirrored element of its own block.
    const unsigned OffsetInBlock = Idx % BlockElts;
    const unsigned BlockStart = Idx - OffsetInBlock;
    const unsigned Mirrored = BlockStart + (BlockElts - 1 - OffsetInBlock);
    if (static_cast<unsigned>(MaskElt) != Mirrored)
      return false;
  }

  return true;
}


} // end namespace llvm


#endif // LLVM_LIB_TARGET_ARM_ARMTARGETTRANSFORMINFO_H

assert
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")

ARMSubtarget.h

ARMTargetMachine.h

ARM.h

ArrayRef.h

BasicTTIImpl.h
This file provides a helper that implements much of the TTI interface in terms of the target-independ...

CostKind
static cl::opt< OutputCostKind > CostKind("cost-kind", cl::desc("Target cost kind"), cl::init(OutputCostKind::RecipThroughput), cl::values(clEnumValN(OutputCostKind::RecipThroughput, "throughput", "Reciprocal throughput"), clEnumValN(OutputCostKind::Latency, "latency", "Instruction latency"), clEnumValN(OutputCostKind::CodeSize, "code-size", "Code size"), clEnumValN(OutputCostKind::SizeAndLatency, "size-latency", "Code size and latency"), clEnumValN(OutputCostKind::All, "all", "Print all cost kinds")))

IntrinsicCostStrategy::InstructionCost
@ InstructionCost
Definition CostModel.cpp:51

Constant.h

Function.h

InlinePriorityMode::Size
@ Size
Definition InlineOrder.cpp:25

TemplateParamKind::Type
@ Type
Definition ItaniumDemangle.h:1243

Ops
const AbstractManglingParser< Derived, Alloc >::OperatorInfo AbstractManglingParser< Derived, Alloc >::Ops[]
Definition ItaniumDemangle.h:3391

F
#define F(x, y, z)
Definition MD5.cpp:54

I
#define I(x, y, z)
Definition MD5.cpp:57

II
uint64_t IntrinsicInst * II
Definition NVVMIntrRange.cpp:46

SubtargetFeature.h

BlockSize
static const int BlockSize
Definition TarWriter.cpp:33

TargetTransformInfo.h
This pass exposes codegen information to IR-level passes.

llvm::APInt
Class for arbitrary precision integers.
Definition APInt.h:78

llvm::ARMBaseTargetMachine
Definition ARMTargetMachine.h:29

llvm::ARMSubtarget
Definition ARMSubtarget.h:48

llvm::ARMTTIImpl::getGatherScatterOpCost
InstructionCost getGatherScatterOpCost(const MemIntrinsicCostAttributes &MICA, TTI::TargetCostKind CostKind) const
Definition ARMTargetTransformInfo.cpp:1706

llvm::ARMTTIImpl::getRegisterBitWidth
TypeSize getRegisterBitWidth(TargetTransformInfo::RegisterKind K) const override
Definition ARMTargetTransformInfo.h:131

llvm::ARMTTIImpl::getAddressComputationCost
InstructionCost getAddressComputationCost(Type *Val, ScalarEvolution *SE, const SCEV *Ptr, TTI::TargetCostKind CostKind) const override
Definition ARMTargetTransformInfo.cpp:1076

llvm::ARMTTIImpl::isFPVectorizationPotentiallyUnsafe
bool isFPVectorizationPotentiallyUnsafe() const override
Floating-point computation using ARMv8 AArch32 Advanced SIMD instructions remains unchanged from ARMv...
Definition ARMTargetTransformInfo.h:82

llvm::ARMTTIImpl::getMaskedMemoryOpCost
InstructionCost getMaskedMemoryOpCost(const MemIntrinsicCostAttributes &MICA, TTI::TargetCostKind CostKind) const
Definition ARMTargetTransformInfo.cpp:1643

llvm::ARMTTIImpl::getMemoryOpCost
InstructionCost getMemoryOpCost(unsigned Opcode, Type *Src, Align Alignment, unsigned AddressSpace, TTI::TargetCostKind CostKind, TTI::OperandValueInfo OpInfo={TTI::OK_AnyValue, TTI::OP_None}, const Instruction *I=nullptr) const override
Definition ARMTargetTransformInfo.cpp:1577

llvm::ARMTTIImpl::getMemcpyCost
InstructionCost getMemcpyCost(const Instruction *I) const override
Definition ARMTargetTransformInfo.cpp:1216

llvm::ARMTTIImpl::isLegalMaskedScatter
bool isLegalMaskedScatter(Type *Ty, Align Alignment) const override
Definition ARMTargetTransformInfo.h:182

llvm::ARMTTIImpl::maybeLoweredToCall
bool maybeLoweredToCall(Instruction &I) const
Definition ARMTargetTransformInfo.cpp:2233

llvm::ARMTTIImpl::preferInLoopReduction
bool preferInLoopReduction(RecurKind Kind, Type *Ty) const override
Definition ARMTargetTransformInfo.cpp:2757

llvm::ARMTTIImpl::getCmpSelInstrCost
InstructionCost getCmpSelInstrCost(unsigned Opcode, Type *ValTy, Type *CondTy, CmpInst::Predicate VecPred, TTI::TargetCostKind CostKind, TTI::OperandValueInfo Op1Info={TTI::OK_AnyValue, TTI::OP_None}, TTI::OperandValueInfo Op2Info={TTI::OK_AnyValue, TTI::OP_None}, const Instruction *I=nullptr) const override
Definition ARMTargetTransformInfo.cpp:929

llvm::ARMTTIImpl::getMulAccReductionCost
InstructionCost getMulAccReductionCost(bool IsUnsigned, unsigned RedOpcode, Type *ResTy, VectorType *ValTy, TTI::TargetCostKind CostKind) const override
Definition ARMTargetTransformInfo.cpp:1936

llvm::ARMTTIImpl::getInterleavedMemoryOpCost
InstructionCost getInterleavedMemoryOpCost(unsigned Opcode, Type *VecTy, unsigned Factor, ArrayRef< unsigned > Indices, Align Alignment, unsigned AddressSpace, TTI::TargetCostKind CostKind, bool UseMaskForCond=false, bool UseMaskForGaps=false) const override
Definition ARMTargetTransformInfo.cpp:1664

llvm::ARMTTIImpl::getIntImmCost
InstructionCost getIntImmCost(const APInt &Imm, Type *Ty, TTI::TargetCostKind CostKind) const override
Definition ARMTargetTransformInfo.cpp:307

llvm::ARMTTIImpl::hasArmWideBranch
bool hasArmWideBranch(bool Thumb) const override
Definition ARMTargetTransformInfo.cpp:2801

llvm::ARMTTIImpl::shouldConsiderVectorizationRegPressure
bool shouldConsiderVectorizationRegPressure() const override
Definition ARMTargetTransformInfo.cpp:2794

llvm::ARMTTIImpl::preferTailFoldingOverEpilogue
bool preferTailFoldingOverEpilogue(TailFoldingInfo *TFI) const override
Definition ARMTargetTransformInfo.cpp:2557

llvm::ARMTTIImpl::shouldExpandReduction
bool shouldExpandReduction(const IntrinsicInst *II) const override
Definition ARMTargetTransformInfo.h:204

llvm::ARMTTIImpl::shouldBuildLookupTablesForConstant
bool shouldBuildLookupTablesForConstant(Constant *C) const override
Definition ARMTargetTransformInfo.h:315

llvm::ARMTTIImpl::getCastInstrCost
InstructionCost getCastInstrCost(unsigned Opcode, Type *Dst, Type *Src, TTI::CastContextHint CCH, TTI::TargetCostKind CostKind, const Instruction *I=nullptr) const override
Definition ARMTargetTransformInfo.cpp:485

llvm::ARMTTIImpl::getNumMemOps
int getNumMemOps(const IntrinsicInst *I) const
Given a memcpy/memset/memmove instruction, return the number of memory operations performed,...
Definition ARMTargetTransformInfo.cpp:1149

llvm::ARMTTIImpl::getCFInstrCost
InstructionCost getCFInstrCost(unsigned Opcode, TTI::TargetCostKind CostKind, const Instruction *I=nullptr) const override
Definition ARMTargetTransformInfo.cpp:471

llvm::ARMTTIImpl::getIntImmCodeSizeCost
InstructionCost getIntImmCodeSizeCost(unsigned Opcode, unsigned Idx, const APInt &Imm, Type *Ty) const override
Definition ARMTargetTransformInfo.cpp:342

llvm::ARMTTIImpl::isLoweredToCall
bool isLoweredToCall(const Function *F) const override
Definition ARMTargetTransformInfo.cpp:2171

llvm::ARMTTIImpl::getExtendedReductionCost
InstructionCost getExtendedReductionCost(unsigned Opcode, bool IsUnsigned, Type *ResTy, VectorType *ValTy, std::optional< FastMathFlags > FMF, TTI::TargetCostKind CostKind) const override
Definition ARMTargetTransformInfo.cpp:1901

llvm::ARMTTIImpl::isProfitableToSinkOperands
bool isProfitableToSinkOperands(Instruction *I, SmallVectorImpl< Use * > &Ops) const override
Check if sinking I's operands to I's basic block is profitable, because the operands can be folded in...
Definition ARMTargetTransformInfo.cpp:2836

llvm::ARMTTIImpl::getMaxMemIntrinsicInlineSizeThreshold
uint64_t getMaxMemIntrinsicInlineSizeThreshold() const override
Definition ARMTargetTransformInfo.h:188

llvm::ARMTTIImpl::isLegalMaskedStore
bool isLegalMaskedStore(Type *DataTy, Align Alignment, unsigned AddressSpace, TTI::MaskKind MaskKind=TTI::MaskKind::VariableOrConstantMask) const override
Definition ARMTargetTransformInfo.h:160

llvm::ARMTTIImpl::forceScalarizeMaskedScatter
bool forceScalarizeMaskedScatter(VectorType *VTy, Align Alignment) const override
Definition ARMTargetTransformInfo.h:175

llvm::ARMTTIImpl::getPartialReductionCost
InstructionCost getPartialReductionCost(unsigned Opcode, Type *InputTypeA, Type *InputTypeB, Type *AccumType, ElementCount VF, TTI::PartialReductionExtendKind OpAExtend, TTI::PartialReductionExtendKind OpBExtend, std::optional< unsigned > BinOp, TTI::TargetCostKind CostKind, std::optional< FastMathFlags > FMF) const override
Definition ARMTargetTransformInfo.h:283

llvm::ARMTTIImpl::getArithmeticReductionCost
InstructionCost getArithmeticReductionCost(unsigned Opcode, VectorType *ValTy, std::optional< FastMathFlags > FMF, TTI::TargetCostKind CostKind) const override
Definition ARMTargetTransformInfo.cpp:1816

llvm::ARMTTIImpl::simplifyDemandedVectorEltsIntrinsic
std::optional< Value * > simplifyDemandedVectorEltsIntrinsic(InstCombiner &IC, IntrinsicInst &II, APInt DemandedElts, APInt &UndefElts, APInt &UndefElts2, APInt &UndefElts3, std::function< void(Instruction *, unsigned, APInt, APInt &)> SimplifyAndSetOp) const override
Definition ARMTargetTransformInfo.cpp:265

llvm::ARMTTIImpl::getMaxInterleaveFactor
unsigned getMaxInterleaveFactor(ElementCount VF, bool HasUnorderedReductions) const override
Definition ARMTargetTransformInfo.h:147

llvm::ARMTTIImpl::isLegalMaskedLoad
bool isLegalMaskedLoad(Type *DataTy, Align Alignment, unsigned AddressSpace, TTI::MaskKind MaskKind=TTI::MaskKind::VariableOrConstantMask) const override
Definition ARMTargetTransformInfo.cpp:1115

llvm::ARMTTIImpl::ARMTTIImpl
ARMTTIImpl(const ARMBaseTargetMachine *TM, const Function &F)
Definition ARMTargetTransformInfo.h:70

llvm::ARMTTIImpl::getPreferredTailFoldingStyle
TailFoldingStyle getPreferredTailFoldingStyle() const override
Definition ARMTargetTransformInfo.cpp:2612

llvm::ARMTTIImpl::getIntImmCostInst
InstructionCost getIntImmCostInst(unsigned Opcode, unsigned Idx, const APInt &Imm, Type *Ty, TTI::TargetCostKind CostKind, Instruction *Inst=nullptr) const override
Definition ARMTargetTransformInfo.cpp:400

llvm::ARMTTIImpl::getArithmeticInstrCost
InstructionCost getArithmeticInstrCost(unsigned Opcode, Type *Ty, TTI::TargetCostKind CostKind, TTI::OperandValueInfo Op1Info={TTI::OK_AnyValue, TTI::OP_None}, TTI::OperandValueInfo Op2Info={TTI::OK_AnyValue, TTI::OP_None}, ArrayRef< const Value * > Args={}, const Instruction *CxtI=nullptr) const override
Definition ARMTargetTransformInfo.cpp:1380

llvm::ARMTTIImpl::getIntrinsicInstrCost
InstructionCost getIntrinsicInstrCost(const IntrinsicCostAttributes &ICA, TTI::TargetCostKind CostKind) const override
Definition ARMTargetTransformInfo.cpp:2026

llvm::ARMTTIImpl::instCombineIntrinsic
std::optional< Instruction * > instCombineIntrinsic(InstCombiner &IC, IntrinsicInst &II) const override
Definition ARMTargetTransformInfo.cpp:112

llvm::ARMTTIImpl::getPeelingPreferences
void getPeelingPreferences(Loop *L, ScalarEvolution &SE, TTI::PeelingPreferences &PP) const override
Definition ARMTargetTransformInfo.cpp:2752

llvm::ARMTTIImpl::getMinMaxReductionCost
InstructionCost getMinMaxReductionCost(Intrinsic::ID IID, VectorType *Ty, FastMathFlags FMF, TTI::TargetCostKind CostKind) const override
Definition ARMTargetTransformInfo.cpp:1966

llvm::ARMTTIImpl::getPreferredAddressingMode
TTI::AddressingModeKind getPreferredAddressingMode(const Loop *L, ScalarEvolution *SE) const override
Definition ARMTargetTransformInfo.cpp:96

llvm::ARMTTIImpl::getVectorInstrCost
InstructionCost getVectorInstrCost(unsigned Opcode, Type *Val, TTI::TargetCostKind CostKind, unsigned Index, const Value *Op0, const Value *Op1, TTI::VectorInstrContext VIC=TTI::VectorInstrContext::None) const override
Definition ARMTargetTransformInfo.cpp:889

llvm::ARMTTIImpl::forceScalarizeMaskedGather
bool forceScalarizeMaskedGather(VectorType *VTy, Align Alignment) const override
Definition ARMTargetTransformInfo.h:166

llvm::ARMTTIImpl::getNumberOfRegisters
unsigned getNumberOfRegisters(unsigned ClassID) const override
Definition ARMTargetTransformInfo.h:115

llvm::ARMTTIImpl::getShuffleCost
InstructionCost getShuffleCost(TTI::ShuffleKind Kind, VectorType *DstTy, VectorType *SrcTy, ArrayRef< int > Mask, TTI::TargetCostKind CostKind, int Index, VectorType *SubTp, ArrayRef< const Value * > Args={}, const Instruction *CxtI=nullptr) const override
Definition ARMTargetTransformInfo.cpp:1226

llvm::ARMTTIImpl::getMemIntrinsicInstrCost
InstructionCost getMemIntrinsicInstrCost(const MemIntrinsicCostAttributes &MICA, TTI::TargetCostKind CostKind) const override
Definition ARMTargetTransformInfo.cpp:1629

llvm::ARMTTIImpl::preferPredicatedReductionSelect
bool preferPredicatedReductionSelect() const override
Definition ARMTargetTransformInfo.cpp:2770

llvm::ARMTTIImpl::isLegalMaskedGather
bool isLegalMaskedGather(Type *Ty, Align Alignment) const override
Definition ARMTargetTransformInfo.cpp:1137

llvm::ARMTTIImpl::getNumBytesToPadGlobalArray
unsigned getNumBytesToPadGlobalArray(unsigned Size, Type *ArrayType) const override
Definition ARMTargetTransformInfo.cpp:2960

llvm::ARMTTIImpl::isProfitableLSRChainElement
bool isProfitableLSRChainElement(Instruction *I) const override
Definition ARMTargetTransformInfo.cpp:1098

llvm::ARMTTIImpl::isHardwareLoopProfitable
bool isHardwareLoopProfitable(Loop *L, ScalarEvolution &SE, AssumptionCache &AC, TargetLibraryInfo *LibInfo, HardwareLoopInfo &HWLoopInfo) const override
Definition ARMTargetTransformInfo.cpp:2320

llvm::ARMTTIImpl::getUnrollingPreferences
void getUnrollingPreferences(Loop *L, ScalarEvolution &SE, TTI::UnrollingPreferences &UP, OptimizationRemarkEmitter *ORE) const override
Definition ARMTargetTransformInfo.cpp:2622

llvm::ARMTTIImpl::enableInterleavedAccessVectorization
bool enableInterleavedAccessVectorization() const override
Definition ARMTargetTransformInfo.h:74

llvm::ARMTTIImpl::getScalingFactorCost
InstructionCost getScalingFactorCost(Type *Ty, GlobalValue *BaseGV, StackOffset BaseOffset, bool HasBaseReg, int64_t Scale, unsigned AddrSpace) const override
getScalingFactorCost - Return the cost of the scaling used in addressing mode represented by AM.
Definition ARMTargetTransformInfo.cpp:2776

llvm::ARMTargetLowering
Definition ARMISelLowering.h:87

llvm::ArrayRef
Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition ArrayRef.h:40

llvm::ArrayType
Class to represent array types.
Definition DerivedTypes.h:458

llvm::AssumptionCache
A cache of @llvm.assume calls within a function.
Definition AssumptionCache.h:44

llvm::BasicTTIImplBase< ARMTTIImpl >::getVectorInstrCost
InstructionCost getVectorInstrCost(unsigned Opcode, Type *Val, TTI::TargetCostKind CostKind, unsigned Index, const Value *Op0, const Value *Op1, TTI::VectorInstrContext VIC=TTI::VectorInstrContext::None) const override
Definition BasicTTIImpl.h:1477

llvm::BasicTTIImplBase< ARMTTIImpl >::BasicTTIImplBase
BasicTTIImplBase(const TargetMachine *TM, const DataLayout &DL)
Definition BasicTTIImpl.h:378

llvm::CmpInst::Predicate
Predicate
This enumeration lists the possible predicates for CmpInst subclasses.
Definition InstrTypes.h:740

llvm::Constant
This is an important base class in LLVM.
Definition Constant.h:43

llvm::ElementCount
Definition TypeSize.h:298

llvm::Function
Definition Function.h:65

llvm::GlobalValue
Definition GlobalValue.h:49

llvm::InstCombiner
The core instruction combiner logic.
Definition InstCombiner.h:49

llvm::InstructionCost
Definition InstructionCost.h:30

llvm::InstructionCost::getInvalid
static InstructionCost getInvalid(CostType Val=0)
Definition InstructionCost.h:82

llvm::Instruction
Definition Instruction.h:70

llvm::IntrinsicInst
A wrapper class for inspecting calls to intrinsic functions.
Definition IntrinsicInst.h:49

llvm::Loop
Represents a single loop in the control flow graph.
Definition LoopInfo.h:40

llvm::OptimizationRemarkEmitter
The optimization diagnostic interface.
Definition OptimizationRemarkEmitter.h:33

llvm::SCEV
This class represents an analyzed expression in the program.
Definition ScalarEvolution.h:249

llvm::ScalarEvolution
The main scalar evolution driver.
Definition ScalarEvolution.h:616

llvm::SmallVectorImpl
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
Definition SmallVector.h:592

llvm::StackOffset
StackOffset holds a fixed and a scalable offset in bytes.
Definition TypeSize.h:30

llvm::TargetLibraryInfo
Provides information about what library functions are available for the current target.
Definition TargetLibraryInfo.h:266

llvm::TargetTransformInfoImplBase::getDataLayout
virtual const DataLayout & getDataLayout() const
Definition TargetTransformInfoImpl.h:51

llvm::TargetTransformInfoImplBase::getIntImmCost
virtual InstructionCost getIntImmCost(const APInt &Imm, Type *Ty, TTI::TargetCostKind CostKind) const
Definition TargetTransformInfoImpl.h:589

llvm::TargetTransformInfo
This pass provides access to the codegen interfaces that are needed for IR-level transformations.
Definition TargetTransformInfo.h:268

llvm::TargetTransformInfo::VectorInstrContext
VectorInstrContext
Represents a hint about the context in which an insert/extract is used.
Definition TargetTransformInfo.h:1068

llvm::TargetTransformInfo::VectorInstrContext::None
@ None
The insert/extract is not used with a load/store.
Definition TargetTransformInfo.h:1069

llvm::TargetTransformInfo::MaskKind
MaskKind
Some targets only support masked load/store with a constant mask.
Definition TargetTransformInfo.h:898

llvm::TargetTransformInfo::VariableOrConstantMask
@ VariableOrConstantMask
Definition TargetTransformInfo.h:899

llvm::TargetTransformInfo::TargetCostKind
TargetCostKind
The kind of cost model.
Definition TargetTransformInfo.h:331

llvm::TargetTransformInfo::OP_None
@ OP_None
Definition TargetTransformInfo.h:1277

llvm::TargetTransformInfo::RegisterKind
RegisterKind
Definition TargetTransformInfo.h:1352

llvm::TargetTransformInfo::RGK_FixedWidthVector
@ RGK_FixedWidthVector
Definition TargetTransformInfo.h:1352

llvm::TargetTransformInfo::RGK_ScalableVector
@ RGK_ScalableVector
Definition TargetTransformInfo.h:1352

llvm::TargetTransformInfo::RGK_Scalar
@ RGK_Scalar
Definition TargetTransformInfo.h:1352

llvm::TargetTransformInfo::PartialReductionExtendKind
PartialReductionExtendKind
Definition TargetTransformInfo.h:270

llvm::TargetTransformInfo::AddressingModeKind
AddressingModeKind
Which addressing mode Loop Strength Reduction will try to generate.
Definition TargetTransformInfo.h:885

llvm::TargetTransformInfo::ShuffleKind
ShuffleKind
The various kinds of shuffle patterns for vector queries.
Definition TargetTransformInfo.h:1248

llvm::TargetTransformInfo::CastContextHint
CastContextHint
Represents a hint about the context in which a cast is used.
Definition TargetTransformInfo.h:1586

llvm::TargetTransformInfo::OK_AnyValue
@ OK_AnyValue
Definition TargetTransformInfo.h:1269

llvm::TypeSize
Definition TypeSize.h:332

llvm::TypeSize::getFixed
static constexpr TypeSize getFixed(ScalarTy ExactSize)
Definition TypeSize.h:343

llvm::TypeSize::getScalable
static constexpr TypeSize getScalable(ScalarTy MinimumSize)
Definition TypeSize.h:346

llvm::Type
The instances of the Type class are immutable: once they are created, they are never changed.
Definition Type.h:46

llvm::Value
LLVM Value Representation.
Definition Value.h:75

llvm::VectorType
Base class of all SIMD vector types.
Definition DerivedTypes.h:490

uint64_t

llvm_unreachable
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
Definition ErrorHandling.h:164

llvm::AMDGPU::HSAMD::Kernel::Key::Args
constexpr char Args[]
Key for Kernel::Metadata::mArgs.
Definition AMDGPUMetadata.h:396

llvm::CallingConv::C
@ C
The default llvm calling convention, compatible with C.
Definition CallingConv.h:34

llvm::Intrinsic::ID
unsigned ID
Definition GenericSSAContext.h:28

llvm::NVPTXAS::AddressSpace
AddressSpace
Definition NVPTXAddrSpace.h:21

llvm::TPLoop
Definition ARMTargetTransformInfo.h:53

llvm::TPLoop::MemTransfer
MemTransfer
Definition ARMTargetTransformInfo.h:54

llvm::TPLoop::Allow
@ Allow
Definition ARMTargetTransformInfo.h:54

llvm::TPLoop::ForceDisabled
@ ForceDisabled
Definition ARMTargetTransformInfo.h:54

llvm::TPLoop::ForceEnabled
@ ForceEnabled
Definition ARMTargetTransformInfo.h:54

llvm::TailPredication
Definition ARMTargetTransformInfo.h:42

llvm::TailPredication::Mode
Mode
Definition ARMTargetTransformInfo.h:43

llvm::TailPredication::ForceEnabled
@ ForceEnabled
Definition ARMTargetTransformInfo.h:48

llvm::TailPredication::Disabled
@ Disabled
Definition ARMTargetTransformInfo.h:44

llvm::TailPredication::EnabledNoReductions
@ EnabledNoReductions
Definition ARMTargetTransformInfo.h:45

llvm::TailPredication::ForceEnabledNoReductions
@ ForceEnabledNoReductions
Definition ARMTargetTransformInfo.h:47

llvm::TailPredication::Enabled
@ Enabled
Definition ARMTargetTransformInfo.h:46

llvm::sandboxir::Instruction
friend class Instruction
Iterator for Instructions in a `BasicBlock`.
Definition BasicBlock.h:73

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition FunctionInfo.h:25

llvm::Value
RelativeUniformCounterPtr ValuesPtrExpr VTableAddr Value
Definition InstrProf.h:143

llvm::ArrayRef
ArrayRef(const T &OneElt) -> ArrayRef< T >

llvm::isVREVMask
bool isVREVMask(ArrayRef< int > M, EVT VT, unsigned BlockSize)
isVREVMask - Check if a vector shuffle corresponds to a VREV instruction with the specified blocksize.
Definition ARMTargetTransformInfo.h:341

llvm::TailFoldingStyle
TailFoldingStyle
Definition TargetTransformInfo.h:224

llvm::VFParamKind::Vector
@ Vector
Definition VFABIDemangler.h:27

llvm::Align
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition Alignment.h:39

llvm::EVT
Extended Value Type.
Definition ValueTypes.h:35

llvm::EVT::getScalarSizeInBits
uint64_t getScalarSizeInBits() const
Definition ValueTypes.h:408

llvm::HardwareLoopInfo
Attributes of a target dependent hardware loop.
Definition TargetTransformInfo.h:103

llvm::TailFoldingInfo
Definition TargetTransformInfo.h:253

llvm::TargetTransformInfo::OperandValueInfo
Definition TargetTransformInfo.h:1285

llvm::TargetTransformInfo::PeelingPreferences
Definition TargetTransformInfo.h:762

llvm::TargetTransformInfo::UnrollingPreferences
Parameters that control the generic loop unrolling transformation.
Definition TargetTransformInfo.h:638