X86TargetTransformInfo.h (LLVM 23.0.0git)
//===-- X86TargetTransformInfo.h - X86 specific TTI -------------*- C++ -*-===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
/// \file
/// This file defines a TargetTransformInfoImplBase conforming object specific
/// to the X86 target machine. It uses the target's detailed information to
/// provide more precise answers to certain TTI queries, while letting the
/// target-independent and default TTI implementations handle the rest.
///
//===----------------------------------------------------------------------===//

#ifndef LLVM_LIB_TARGET_X86_X86TARGETTRANSFORMINFO_H
#define LLVM_LIB_TARGET_X86_X86TARGETTRANSFORMINFO_H

#include "X86TargetMachine.h"
#include "llvm/Analysis/TargetTransformInfo.h"
#include "llvm/CodeGen/BasicTTIImpl.h"
#include <optional>

namespace llvm {

class InstCombiner;

class X86TTIImpl final : public BasicTTIImplBase<X86TTIImpl> {
  typedef BasicTTIImplBase<X86TTIImpl> BaseT;
  typedef TargetTransformInfo TTI;
  friend BaseT;

  const X86Subtarget *ST;
  const X86TargetLowering *TLI;

  const X86Subtarget *getST() const { return ST; }
  const X86TargetLowering *getTLI() const { return TLI; }

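  // Features in this list may safely differ between caller and callee when
  // deciding whether inlining is allowed; a simplified sketch of how
  // areInlineCompatible() consumes it in the corresponding .cpp:
  //   FeatureBitset RealCallerBits = CallerBits & ~InlineFeatureIgnoreList;
  //   FeatureBitset RealCalleeBits = CalleeBits & ~InlineFeatureIgnoreList;
  //   return (RealCallerBits & RealCalleeBits) == RealCalleeBits;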
  const FeatureBitset InlineFeatureIgnoreList = {
      // clang-format off
      // This indicates that the CPU is 64-bit capable, not that we are in
      // 64-bit mode.
      X86::FeatureX86_64,

      // These features have no intrinsics or ABI effect.
      X86::FeatureNOPL,
      X86::FeatureCX16,
      X86::FeatureLAHFSAHF64,

      // Some older targets can be set up to fold unaligned loads.
      X86::FeatureSSEUnalignedMem,

      // Codegen control options.
      X86::TuningFast11ByteNOP,
      X86::TuningFast15ByteNOP,
      X86::TuningFastBEXTR,
      X86::TuningFastHorizontalOps,
      X86::TuningFastLZCNT,
      X86::TuningFastScalarFSQRT,
      X86::TuningFastSHLDRotate,
      X86::TuningFastScalarShiftMasks,
      X86::TuningFastVectorShiftMasks,
      X86::TuningFastVariableCrossLaneShuffle,
      X86::TuningFastVariablePerLaneShuffle,
      X86::TuningFastVectorFSQRT,
      X86::TuningLEAForSP,
      X86::TuningLEAUsesAG,
      X86::TuningLZCNTFalseDeps,
      X86::TuningBranchFusion,
      X86::TuningMacroFusion,
      X86::TuningPadShortFunctions,
      X86::TuningPOPCNTFalseDeps,
      X86::TuningMULCFalseDeps,
      X86::TuningPERMFalseDeps,
      X86::TuningRANGEFalseDeps,
      X86::TuningGETMANTFalseDeps,
      X86::TuningMULLQFalseDeps,
      X86::TuningSlow3OpsLEA,
      X86::TuningSlowDivide32,
      X86::TuningSlowDivide64,
      X86::TuningSlowIncDec,
      X86::TuningSlowIndirectCall,
      X86::TuningSlowLEA,
      X86::TuningSlowPMADDWD,
      X86::TuningSlowPMULLD,
      X86::TuningSlowSHLD,
      X86::TuningSlowTwoMemOps,
      X86::TuningSlowUAMem16,
      X86::TuningPreferMaskRegisters,
      X86::TuningInsertVZEROUPPER,
      X86::TuningUseSLMArithCosts,
      X86::TuningUseGLMDivSqrtCosts,
      X86::TuningNoDomainDelay,
      X86::TuningNoDomainDelayMov,
      X86::TuningNoDomainDelayShuffle,
      X86::TuningNoDomainDelayBlend,
      X86::TuningPreferShiftShuffle,
      X86::TuningFastImmVectorShift,
      X86::TuningFastDPWSSD,

      // Perf-tuning flags.
      X86::TuningFastGather,
      X86::TuningSlowUAMem32,
      X86::TuningAllowLight256Bit,

      // Based on whether the user set the -mprefer-vector-width command-line
      // option.
      X86::TuningPrefer128Bit,
      X86::TuningPrefer256Bit,

      // CPU name enums. These just follow the CPU string.
      X86::ProcIntelAtom
      // clang-format on
  };

public:
  explicit X86TTIImpl(const X86TargetMachine *TM, const Function &F)
      : BaseT(TM, F.getDataLayout()), ST(TM->getSubtargetImpl(F)),
        TLI(ST->getTargetLowering()) {}

  /// \name Scalar TTI Implementations
  /// @{
  TTI::PopcntSupportKind getPopcntSupport(unsigned TyWidth) const override;

  /// @}

  /// \name Cache TTI Implementation
  /// @{
  std::optional<unsigned> getCacheSize(
      TargetTransformInfo::CacheLevel Level) const override;
  std::optional<unsigned> getCacheAssociativity(
      TargetTransformInfo::CacheLevel Level) const override;
  /// @}

  /// \name Vector TTI Implementations
  /// @{

  unsigned getNumberOfRegisters(unsigned ClassID) const override;
  unsigned getRegisterClassForType(bool Vector, Type *Ty) const override;
  bool hasConditionalLoadStoreForType(Type *Ty, bool IsStore) const override;
  TypeSize
  getRegisterBitWidth(TargetTransformInfo::RegisterKind K) const override;
  unsigned getLoadStoreVecRegBitWidth(unsigned AS) const override;
  unsigned getMaxInterleaveFactor(ElementCount VF) const override;
  InstructionCost getArithmeticInstrCost(
      unsigned Opcode, Type *Ty, TTI::TargetCostKind CostKind,
      TTI::OperandValueInfo Op1Info = {TTI::OK_AnyValue, TTI::OP_None},
      TTI::OperandValueInfo Op2Info = {TTI::OK_AnyValue, TTI::OP_None},
      ArrayRef<const Value *> Args = {},
      const Instruction *CxtI = nullptr) const override;
  InstructionCost getAltInstrCost(VectorType *VecTy, unsigned Opcode0,
                                  unsigned Opcode1,
                                  const SmallBitVector &OpcodeMask,
                                  TTI::TargetCostKind CostKind) const override;

  InstructionCost
  getShuffleCost(TTI::ShuffleKind Kind, VectorType *DstTy, VectorType *SrcTy,
                 ArrayRef<int> Mask, TTI::TargetCostKind CostKind, int Index,
                 VectorType *SubTp, ArrayRef<const Value *> Args = {},
                 const Instruction *CxtI = nullptr) const override;
  InstructionCost
  getCastInstrCost(unsigned Opcode, Type *Dst, Type *Src,
                   TTI::CastContextHint CCH, TTI::TargetCostKind CostKind,
                   const Instruction *I = nullptr) const override;
  InstructionCost getCmpSelInstrCost(
      unsigned Opcode, Type *ValTy, Type *CondTy, CmpInst::Predicate VecPred,
      TTI::TargetCostKind CostKind,
      TTI::OperandValueInfo Op1Info = {TTI::OK_AnyValue, TTI::OP_None},
      TTI::OperandValueInfo Op2Info = {TTI::OK_AnyValue, TTI::OP_None},
      const Instruction *I = nullptr) const override;
  InstructionCost
  getVectorInstrCost(unsigned Opcode, Type *Val, TTI::TargetCostKind CostKind,
                     unsigned Index, const Value *Op0, const Value *Op1,
                     TTI::VectorInstrContext VIC =
                         TTI::VectorInstrContext::None) const override;
  InstructionCost
  getScalarizationOverhead(VectorType *Ty, const APInt &DemandedElts,
                           bool Insert, bool Extract,
                           TTI::TargetCostKind CostKind,
                           bool ForPoisonSrc = true, ArrayRef<Value *> VL = {},
                           TTI::VectorInstrContext VIC =
                               TTI::VectorInstrContext::None) const override;
  InstructionCost
  getReplicationShuffleCost(Type *EltTy, int ReplicationFactor, int VF,
                            const APInt &DemandedDstElts,
                            TTI::TargetCostKind CostKind) const override;
  InstructionCost getMemoryOpCost(
      unsigned Opcode, Type *Src, Align Alignment, unsigned AddressSpace,
      TTI::TargetCostKind CostKind,
      TTI::OperandValueInfo OpInfo = {TTI::OK_AnyValue, TTI::OP_None},
      const Instruction *I = nullptr) const override;
  InstructionCost
  getMemIntrinsicInstrCost(const MemIntrinsicCostAttributes &MICA,
                           TTI::TargetCostKind CostKind) const override;
  InstructionCost getMaskedMemoryOpCost(const MemIntrinsicCostAttributes &MICA,
                                        TTI::TargetCostKind CostKind) const;
  InstructionCost getGatherScatterOpCost(const MemIntrinsicCostAttributes &MICA,
                                         TTI::TargetCostKind CostKind) const;
  InstructionCost
  getPointersChainCost(ArrayRef<const Value *> Ptrs, const Value *Base,
                       const TTI::PointersChainInfo &Info, Type *AccessTy,
                       TTI::TargetCostKind CostKind) const override;
  InstructionCost
  getAddressComputationCost(Type *PtrTy, ScalarEvolution *SE, const SCEV *Ptr,
                            TTI::TargetCostKind CostKind) const override;

  std::optional<Instruction *>
  instCombineIntrinsic(InstCombiner &IC, IntrinsicInst &II) const override;
  std::optional<Value *>
  simplifyDemandedUseBitsIntrinsic(InstCombiner &IC, IntrinsicInst &II,
                                   APInt DemandedMask, KnownBits &Known,
                                   bool &KnownBitsComputed) const override;
  std::optional<Value *> simplifyDemandedVectorEltsIntrinsic(
      InstCombiner &IC, IntrinsicInst &II, APInt DemandedElts, APInt &UndefElts,
      APInt &UndefElts2, APInt &UndefElts3,
      std::function<void(Instruction *, unsigned, APInt, APInt &)>
          SimplifyAndSetOp) const override;

  unsigned getAtomicMemIntrinsicMaxElementSize() const override;

  InstructionCost
  getIntrinsicInstrCost(const IntrinsicCostAttributes &ICA,
                        TTI::TargetCostKind CostKind) const override;

  InstructionCost
  getArithmeticReductionCost(unsigned Opcode, VectorType *Ty,
                             std::optional<FastMathFlags> FMF,
                             TTI::TargetCostKind CostKind) const override;

  InstructionCost getPartialReductionCost(
      unsigned Opcode, Type *InputTypeA, Type *InputTypeB, Type *AccumType,
      ElementCount VF, TTI::PartialReductionExtendKind OpAExtend,
      TTI::PartialReductionExtendKind OpBExtend, std::optional<unsigned> BinOp,
      TTI::TargetCostKind CostKind,
      std::optional<FastMathFlags> FMF) const override {
    return InstructionCost::getInvalid();
  }

  InstructionCost getMinMaxCost(Intrinsic::ID IID, Type *Ty,
                                TTI::TargetCostKind CostKind,
                                FastMathFlags FMF) const;

  InstructionCost
  getMinMaxReductionCost(Intrinsic::ID IID, VectorType *Ty, FastMathFlags FMF,
                         TTI::TargetCostKind CostKind) const override;

  InstructionCost getInterleavedMemoryOpCost(
      unsigned Opcode, Type *VecTy, unsigned Factor, ArrayRef<unsigned> Indices,
      Align Alignment, unsigned AddressSpace, TTI::TargetCostKind CostKind,
      bool UseMaskForCond = false, bool UseMaskForGaps = false) const override;
  InstructionCost getInterleavedMemoryOpCostAVX512(
      unsigned Opcode, FixedVectorType *VecTy, unsigned Factor,
      ArrayRef<unsigned> Indices, Align Alignment, unsigned AddressSpace,
      TTI::TargetCostKind CostKind, bool UseMaskForCond = false,
      bool UseMaskForGaps = false) const;

  InstructionCost getIntImmCost(int64_t) const;

  InstructionCost getIntImmCost(const APInt &Imm, Type *Ty,
                                TTI::TargetCostKind CostKind) const override;

  InstructionCost getCFInstrCost(unsigned Opcode, TTI::TargetCostKind CostKind,
                                 const Instruction *I = nullptr) const override;

  InstructionCost getIntImmCostInst(unsigned Opcode, unsigned Idx,
                                    const APInt &Imm, Type *Ty,
                                    TTI::TargetCostKind CostKind,
                                    Instruction *Inst = nullptr) const override;
  InstructionCost
  getIntImmCostIntrin(Intrinsic::ID IID, unsigned Idx, const APInt &Imm,
                      Type *Ty, TTI::TargetCostKind CostKind) const override;
  /// Return the cost of the scaling factor used in the addressing
  /// mode represented by AM for this target, for a load/store
  /// of the specified type.
  /// If the AM is supported, the return value must be >= 0.
  /// If the AM is not supported, it returns an invalid cost.
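  /// For example (illustrative), a 4-byte element access lowered to the
  /// addressing mode BaseReg + 4 * IndexReg would be queried with Scale == 4;
  /// x86 SIB addressing encodes scales of 1, 2, 4, and 8 directly.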
  InstructionCost getScalingFactorCost(Type *Ty, GlobalValue *BaseGV,
                                       StackOffset BaseOffset, bool HasBaseReg,
                                       int64_t Scale,
                                       unsigned AddrSpace) const override;

  bool isLSRCostLess(const TargetTransformInfo::LSRCost &C1,
                     const TargetTransformInfo::LSRCost &C2) const override;
  bool canMacroFuseCmp() const override;
  bool
  isLegalMaskedLoad(Type *DataType, Align Alignment, unsigned AddressSpace,
                    TTI::MaskKind MaskKind =
                        TTI::MaskKind::VariableOrConstantMask) const override;
  bool
  isLegalMaskedStore(Type *DataType, Align Alignment, unsigned AddressSpace,
                     TTI::MaskKind MaskKind =
                         TTI::MaskKind::VariableOrConstantMask) const override;
  bool isLegalNTLoad(Type *DataType, Align Alignment) const override;
  bool isLegalNTStore(Type *DataType, Align Alignment) const override;
  bool isLegalBroadcastLoad(Type *ElementTy,
                            ElementCount NumElements) const override;
  bool forceScalarizeMaskedGather(VectorType *VTy,
                                  Align Alignment) const override;
  bool forceScalarizeMaskedScatter(VectorType *VTy,
                                   Align Alignment) const override {
    return forceScalarizeMaskedGather(VTy, Alignment);
  }
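  // Note: forced scatter scalarization simply mirrors the gather decision
  // above, so the two predicates can never diverge.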
  bool isLegalMaskedGatherScatter(Type *DataType, Align Alignment) const;
  bool isLegalMaskedGather(Type *DataType, Align Alignment) const override;
  bool isLegalMaskedScatter(Type *DataType, Align Alignment) const override;
  bool isLegalMaskedExpandLoad(Type *DataType, Align Alignment) const override;
  bool isLegalMaskedCompressStore(Type *DataType,
                                  Align Alignment) const override;
  bool isLegalAltInstr(VectorType *VecTy, unsigned Opcode0, unsigned Opcode1,
                       const SmallBitVector &OpcodeMask) const override;
  bool hasDivRemOp(Type *DataType, bool IsSigned) const override;
  bool isExpensiveToSpeculativelyExecute(const Instruction *I) const override;
  bool isFCmpOrdCheaperThanFCmpZero(Type *Ty) const override;
  bool areInlineCompatible(const Function *Caller,
                           const Function *Callee) const override;
  bool areTypesABICompatible(const Function *Caller, const Function *Callee,
                             ArrayRef<Type *> Type) const override;

  uint64_t getMaxMemIntrinsicInlineSizeThreshold() const override {
    return ST->getMaxInlineSizeThreshold();
  }

  TTI::MemCmpExpansionOptions
  enableMemCmpExpansion(bool OptSize, bool IsZeroCmp) const override;
  bool preferAlternateOpcodeVectorization() const override { return false; }
  bool prefersVectorizedAddressing() const override;
  bool supportsEfficientVectorElementLoadStore() const override;
  bool enableInterleavedAccessVectorization() const override;

  InstructionCost getBranchMispredictPenalty() const override;

  bool isProfitableToSinkOperands(Instruction *I,
                                  SmallVectorImpl<Use *> &Ops) const override;

  bool isVectorShiftByScalarCheap(Type *Ty) const override;

  unsigned getStoreMinimumVF(unsigned VF, Type *ScalarMemTy, Type *ScalarValTy,
                             Align Alignment,
                             unsigned AddrSpace) const override;

  bool useFastCCForInternalCall(Function &F) const override;

private:
  bool supportsGather() const;
  InstructionCost getGSVectorCost(unsigned Opcode, TTI::TargetCostKind CostKind,
                                  Type *DataTy, const Value *Ptr,
                                  Align Alignment, unsigned AddressSpace) const;

  int getGatherOverhead() const;
  int getScatterOverhead() const;

  /// @}
};

} // end namespace llvm

#endif
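
A minimal usage sketch: IR-level passes normally reach X86TTIImpl through the generic TargetTransformInfo facade handed out by the TargetMachine rather than constructing it directly. The helper name queryX86Costs below is hypothetical, and the TargetMachine is assumed to have been created for an x86 triple elsewhere (e.g. via the TargetRegistry after LLVMInitializeX86Target()).

#include "llvm/Analysis/TargetTransformInfo.h"
#include "llvm/IR/Function.h"
#include "llvm/Target/TargetMachine.h"
#include <optional>

using namespace llvm;

void queryX86Costs(const TargetMachine &TM, const Function &F) {
  // For an x86 triple this wraps an X86TTIImpl behind the generic interface.
  TargetTransformInfo TTInfo = TM.getTargetTransformInfo(F);

  // Scalar query: what kind of popcnt support exists for 32-bit integers?
  TargetTransformInfo::PopcntSupportKind PSK = TTInfo.getPopcntSupport(32);
  (void)PSK;

  // Cache query: L1 data cache size, if the subtarget model reports one.
  if (std::optional<unsigned> L1D =
          TTInfo.getCacheSize(TargetTransformInfo::CacheLevel::L1D))
    (void)*L1D;
}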