LLVM 23.0.0git
AMDGPUMCCodeEmitter.cpp
Go to the documentation of this file.
1//===-- AMDGPUMCCodeEmitter.cpp - AMDGPU Code Emitter ---------------------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9/// \file
10/// The AMDGPU code emitter produces machine code that can be executed
11/// directly on the GPU device.
12//
13//===----------------------------------------------------------------------===//
14
18#include "SIDefines.h"
20#include "llvm/ADT/APInt.h"
22#include "llvm/MC/MCContext.h"
23#include "llvm/MC/MCExpr.h"
24#include "llvm/MC/MCInstrInfo.h"
29#include <optional>
30
31using namespace llvm;
32
namespace {

/// Emits AMDGPU machine code for MCInsts: per-operand encoders feed
/// getBinaryCodeForInstr, and expression operands become MCFixups.
class AMDGPUMCCodeEmitter : public MCCodeEmitter {
  const MCRegisterInfo &MRI;  // Register encodings (getEncodingValue).
  const MCInstrInfo &MCII;    // Instruction descriptors (TSFlags, operand info).

public:
  AMDGPUMCCodeEmitter(const MCInstrInfo &MCII, const MCRegisterInfo &MRI)
      : MRI(MRI), MCII(MCII) {}

  /// Encode the instruction and write it to the OS.
  void encodeInstruction(const MCInst &MI, SmallVectorImpl<char> &CB,
                         SmallVectorImpl<MCFixup> &Fixups,
                         const MCSubtargetInfo &STI) const override;

  /// Encode a generic operand: registers directly, immediates/expressions
  /// via getMachineOpValueCommon (which may add a fixup).
  void getMachineOpValue(const MCInst &MI, const MCOperand &MO, APInt &Op,
                         SmallVectorImpl<MCFixup> &Fixups,
                         const MCSubtargetInfo &STI) const;

  /// Encode a true-16 operand; also mirrors the hi-half (op_sel) bit between
  /// VGPR encodings and src_modifiers operands.
  void getMachineOpValueT16(const MCInst &MI, unsigned OpNo, APInt &Op,
                            SmallVectorImpl<MCFixup> &Fixups,
                            const MCSubtargetInfo &STI) const;

  /// Encode a true-16 operand restricted to v0-v127 (7-bit index plus
  /// hi-half and is-VGPR bits).
  void getMachineOpValueT16Lo128(const MCInst &MI, unsigned OpNo, APInt &Op,
                                 SmallVectorImpl<MCFixup> &Fixups,
                                 const MCSubtargetInfo &STI) const;

  /// Use a fixup to encode the simm16 field for SOPP branch
  /// instructions.
  void getSOPPBrEncoding(const MCInst &MI, unsigned OpNo, APInt &Op,
                         SmallVectorImpl<MCFixup> &Fixups,
                         const MCSubtargetInfo &STI) const;

  /// Encode an SMEM offset operand.
  void getSMEMOffsetEncoding(const MCInst &MI, unsigned OpNo, APInt &Op,
                             SmallVectorImpl<MCFixup> &Fixups,
                             const MCSubtargetInfo &STI) const;

  /// Encode an SDWA source operand (register or inline-constant literal).
  void getSDWASrcEncoding(const MCInst &MI, unsigned OpNo, APInt &Op,
                          SmallVectorImpl<MCFixup> &Fixups,
                          const MCSubtargetInfo &STI) const;

  /// Encode the SDWA VOPC destination; non-VCC SGPR destinations get the
  /// VCC-override bit set.
  void getSDWAVopcDstEncoding(const MCInst &MI, unsigned OpNo, APInt &Op,
                              SmallVectorImpl<MCFixup> &Fixups,
                              const MCSubtargetInfo &STI) const;

  /// Encode an operand that may be an AGPR or VGPR (distinguished via a
  /// virtual 9th register bit).
  void getAVOperandEncoding(const MCInst &MI, unsigned OpNo, APInt &Op,
                            SmallVectorImpl<MCFixup> &Fixups,
                            const MCSubtargetInfo &STI) const;

private:
  // Value to OR into the encoding for op_sel_hi bits of absent VOP3P sources.
  uint64_t getImplicitOpSelHiEncoding(int Opcode) const;
  // Shared non-register path for the getMachineOpValue* entry points.
  void getMachineOpValueCommon(const MCInst &MI, const MCOperand &MO,
                               unsigned OpNo, APInt &Op,
                               SmallVectorImpl<MCFixup> &Fixups,
                               const MCSubtargetInfo &STI) const;

  /// Encode an fp or int literal.
  std::optional<uint64_t>
  getLitEncoding(const MCInstrDesc &Desc, const MCOperand &MO, unsigned OpNo,
                 const MCSubtargetInfo &STI,
                 bool HasMandatoryLiteral = false) const;

  // TableGen-generated encoder (see AMDGPUGenMCCodeEmitter.inc).
  void getBinaryCodeForInstr(const MCInst &MI, SmallVectorImpl<MCFixup> &Fixups,
                             APInt &Inst, APInt &Scratch,
                             const MCSubtargetInfo &STI) const;

  // Post-encoding fixups: fill unused VOP3 source fields on GFX10+.
  template <bool HasSrc0, bool HasSrc1, bool HasSrc2>
  APInt postEncodeVOP3(const MCInst &MI, APInt EncodedValue,
                       const MCSubtargetInfo &STI) const;

  // Post-encoding fixup for VOPCX: force dst = EXEC for SP3 compatibility.
  APInt postEncodeVOPCX(const MCInst &MI, APInt EncodedValue,
                        const MCSubtargetInfo &STI) const;
};

} // end anonymous namespace
108
110 MCContext &Ctx) {
111 return new AMDGPUMCCodeEmitter(MCII, *Ctx.getRegisterInfo());
112}
113
115 const MCExpr *Value, uint16_t Kind, bool PCRel = false) {
116 Fixups.push_back(MCFixup::create(Offset, Value, Kind, PCRel));
117}
118
119// Returns the encoding value to use if the given integer is an integer inline
120// immediate value, or 0 if it is not.
121template <typename IntTy>
123 if (Imm >= 0 && Imm <= 64)
124 return 128 + Imm;
125
126 if (Imm >= -16 && Imm <= -1)
127 return 192 + std::abs(Imm);
128
129 return 0;
130}
131
133 uint16_t IntImm = getIntInlineImmEncoding(static_cast<int16_t>(Val));
134 if (IntImm != 0)
135 return IntImm;
136
137 if (Val == 0x3800) // 0.5
138 return 240;
139
140 if (Val == 0xB800) // -0.5
141 return 241;
142
143 if (Val == 0x3C00) // 1.0
144 return 242;
145
146 if (Val == 0xBC00) // -1.0
147 return 243;
148
149 if (Val == 0x4000) // 2.0
150 return 244;
151
152 if (Val == 0xC000) // -2.0
153 return 245;
154
155 if (Val == 0x4400) // 4.0
156 return 246;
157
158 if (Val == 0xC400) // -4.0
159 return 247;
160
161 if (Val == 0x3118 && // 1.0 / (2.0 * pi)
162 STI.hasFeature(AMDGPU::FeatureInv2PiInlineImm))
163 return 248;
164
165 return 255;
166}
167
169 uint16_t IntImm = getIntInlineImmEncoding(static_cast<int16_t>(Val));
170 if (IntImm != 0)
171 return IntImm;
172
173 // clang-format off
174 switch (Val) {
175 case 0x3F00: return 240; // 0.5
176 case 0xBF00: return 241; // -0.5
177 case 0x3F80: return 242; // 1.0
178 case 0xBF80: return 243; // -1.0
179 case 0x4000: return 244; // 2.0
180 case 0xC000: return 245; // -2.0
181 case 0x4080: return 246; // 4.0
182 case 0xC080: return 247; // -4.0
183 case 0x3E22: return 248; // 1.0 / (2.0 * pi)
184 default: return 255;
185 }
186 // clang-format on
187}
188
190 uint32_t IntImm = getIntInlineImmEncoding(static_cast<int32_t>(Val));
191 if (IntImm != 0)
192 return IntImm;
193
194 if (Val == llvm::bit_cast<uint32_t>(0.5f))
195 return 240;
196
197 if (Val == llvm::bit_cast<uint32_t>(-0.5f))
198 return 241;
199
200 if (Val == llvm::bit_cast<uint32_t>(1.0f))
201 return 242;
202
203 if (Val == llvm::bit_cast<uint32_t>(-1.0f))
204 return 243;
205
206 if (Val == llvm::bit_cast<uint32_t>(2.0f))
207 return 244;
208
209 if (Val == llvm::bit_cast<uint32_t>(-2.0f))
210 return 245;
211
212 if (Val == llvm::bit_cast<uint32_t>(4.0f))
213 return 246;
214
215 if (Val == llvm::bit_cast<uint32_t>(-4.0f))
216 return 247;
217
218 if (Val == 0x3e22f983 && // 1.0 / (2.0 * pi)
219 STI.hasFeature(AMDGPU::FeatureInv2PiInlineImm))
220 return 248;
221
222 return 255;
223}
224
226 return getLit32Encoding(Val, STI);
227}
228
230 const MCSubtargetInfo &STI, bool IsFP) {
231 uint32_t IntImm = getIntInlineImmEncoding(static_cast<int64_t>(Val));
232 if (IntImm != 0)
233 return IntImm;
234
235 if (Val == llvm::bit_cast<uint64_t>(0.5))
236 return 240;
237
238 if (Val == llvm::bit_cast<uint64_t>(-0.5))
239 return 241;
240
241 if (Val == llvm::bit_cast<uint64_t>(1.0))
242 return 242;
243
244 if (Val == llvm::bit_cast<uint64_t>(-1.0))
245 return 243;
246
247 if (Val == llvm::bit_cast<uint64_t>(2.0))
248 return 244;
249
250 if (Val == llvm::bit_cast<uint64_t>(-2.0))
251 return 245;
252
253 if (Val == llvm::bit_cast<uint64_t>(4.0))
254 return 246;
255
256 if (Val == llvm::bit_cast<uint64_t>(-4.0))
257 return 247;
258
259 if (Val == 0x3fc45f306dc9c882 && // 1.0 / (2.0 * pi)
260 STI.hasFeature(AMDGPU::FeatureInv2PiInlineImm))
261 return 248;
262
263 // The rest part needs to align with AMDGPUInstPrinter::printLiteral64.
264
265 bool CanUse64BitLiterals =
266 STI.hasFeature(AMDGPU::Feature64BitLiterals) &&
268 if (IsFP) {
269 return CanUse64BitLiterals && Lo_32(Val) ? 254 : 255;
270 }
271
272 return CanUse64BitLiterals && (!isInt<32>(Val) || !isUInt<32>(Val)) ? 254
273 : 255;
274}
275
276std::optional<uint64_t> AMDGPUMCCodeEmitter::getLitEncoding(
277 const MCInstrDesc &Desc, const MCOperand &MO, unsigned OpNo,
278 const MCSubtargetInfo &STI, bool HasMandatoryLiteral) const {
279 const MCOperandInfo &OpInfo = Desc.operands()[OpNo];
280 int64_t Imm = 0;
281 if (MO.isExpr()) {
282 if (!MO.getExpr()->evaluateAsAbsolute(Imm) ||
284 if (OpInfo.OperandType == AMDGPU::OPERAND_KIMM16 ||
287 return Imm;
288 if (STI.hasFeature(AMDGPU::Feature64BitLiterals) &&
289 AMDGPU::getOperandSize(OpInfo) == 8 &&
291 return 254;
292 return 255;
293 }
294 } else {
295 assert(!MO.isDFPImm());
296
297 if (!MO.isImm())
298 return {};
299
300 Imm = MO.getImm();
301 }
302
303 switch (OpInfo.OperandType) {
313 return getLit32Encoding(static_cast<uint32_t>(Imm), STI);
314
317 return getLit64Encoding(Desc, static_cast<uint64_t>(Imm), STI, false);
318
321 return getLit64Encoding(Desc, static_cast<uint64_t>(Imm), STI, true);
322
324 auto Enc = getLit64Encoding(Desc, static_cast<uint64_t>(Imm), STI, true);
325 return (HasMandatoryLiteral && Enc == 255) ? 254 : Enc;
326 }
327
330 return getLit16IntEncoding(static_cast<uint32_t>(Imm), STI);
331
334 // FIXME Is this correct? What do inline immediates do on SI for f16 src
335 // which does not have f16 support?
336 return getLit16Encoding(static_cast<uint16_t>(Imm), STI);
337
340 // We don't actually need to check Inv2Pi here because BF16 instructions can
341 // only be emitted for targets that already support the feature.
342 return getLitBF16Encoding(static_cast<uint16_t>(Imm));
343
346 return AMDGPU::getInlineEncodingV2I16(static_cast<uint32_t>(Imm))
347 .value_or(255);
348
351 return AMDGPU::getInlineEncodingV2F16(static_cast<uint32_t>(Imm))
352 .value_or(255);
353
355 // V_PK_FMAC_F16 has different inline constant behavior on pre-GFX11 vs
356 // GFX11+: pre-GFX11 produces (f16, 0), GFX11+ duplicates f16 to both
357 // halves.
358 return AMDGPU::getPKFMACF16InlineEncoding(static_cast<uint32_t>(Imm),
360 .value_or(255);
361
364 return AMDGPU::getInlineEncodingV2BF16(static_cast<uint32_t>(Imm))
365 .value_or(255);
366
368 return 255;
369
373 return Imm;
374 default:
375 llvm_unreachable("invalid operand size");
376 }
377}
378
379uint64_t AMDGPUMCCodeEmitter::getImplicitOpSelHiEncoding(int Opcode) const {
380 using namespace AMDGPU::VOP3PEncoding;
381
382 if (AMDGPU::hasNamedOperand(Opcode, AMDGPU::OpName::op_sel_hi)) {
383 if (AMDGPU::hasNamedOperand(Opcode, AMDGPU::OpName::src2))
384 return 0;
385 if (AMDGPU::hasNamedOperand(Opcode, AMDGPU::OpName::src1))
386 return OP_SEL_HI_2;
387 if (AMDGPU::hasNamedOperand(Opcode, AMDGPU::OpName::src0))
388 return OP_SEL_HI_1 | OP_SEL_HI_2;
389 }
391}
392
393void AMDGPUMCCodeEmitter::encodeInstruction(const MCInst &MI,
394 SmallVectorImpl<char> &CB,
395 SmallVectorImpl<MCFixup> &Fixups,
396 const MCSubtargetInfo &STI) const {
397 int Opcode = MI.getOpcode();
398 APInt Encoding, Scratch;
399 getBinaryCodeForInstr(MI, Fixups, Encoding, Scratch, STI);
400 const MCInstrDesc &Desc = MCII.get(MI.getOpcode());
401 unsigned bytes = Desc.getSize();
402
403 // Set unused op_sel_hi bits to 1 for VOP3P and MAI instructions.
404 // Note that accvgpr_read/write are MAI, have src0, but do not use op_sel.
405 if (((Desc.TSFlags & SIInstrFlags::VOP3P) ||
406 Opcode == AMDGPU::V_ACCVGPR_READ_B32_vi ||
407 Opcode == AMDGPU::V_ACCVGPR_WRITE_B32_vi) &&
408 // Matrix B format operand reuses op_sel_hi.
409 !AMDGPU::hasNamedOperand(Opcode, AMDGPU::OpName::matrix_b_fmt) &&
410 // Matrix B scale operand reuses op_sel_hi.
411 !AMDGPU::hasNamedOperand(Opcode, AMDGPU::OpName::matrix_b_scale) &&
412 // Matrix B reuse operand reuses op_sel_hi.
413 !AMDGPU::hasNamedOperand(Opcode, AMDGPU::OpName::matrix_b_reuse)) {
414 Encoding |= getImplicitOpSelHiEncoding(Opcode);
415 }
416
417 for (unsigned i = 0; i < bytes; i++) {
418 CB.push_back((uint8_t)Encoding.extractBitsAsZExtValue(8, 8 * i));
419 }
420
421 // NSA encoding.
422 if (AMDGPU::isGFX10Plus(STI) && Desc.TSFlags & SIInstrFlags::MIMG) {
423 int vaddr0 = AMDGPU::getNamedOperandIdx(MI.getOpcode(),
424 AMDGPU::OpName::vaddr0);
425 int srsrc = AMDGPU::getNamedOperandIdx(MI.getOpcode(),
426 AMDGPU::OpName::srsrc);
427 assert(vaddr0 >= 0 && srsrc > vaddr0);
428 unsigned NumExtraAddrs = srsrc - vaddr0 - 1;
429 unsigned NumPadding = (-NumExtraAddrs) & 3;
430
431 for (unsigned i = 0; i < NumExtraAddrs; ++i) {
432 getMachineOpValue(MI, MI.getOperand(vaddr0 + 1 + i), Encoding, Fixups,
433 STI);
434 CB.push_back((uint8_t)Encoding.getLimitedValue());
435 }
436 CB.append(NumPadding, 0);
437 }
438
439 if ((bytes > 8 && STI.hasFeature(AMDGPU::FeatureVOP3Literal)) ||
440 (bytes > 4 && !STI.hasFeature(AMDGPU::FeatureVOP3Literal)))
441 return;
442
443 // Do not print literals from SISrc Operands for insts with mandatory literals
444 if (AMDGPU::hasNamedOperand(MI.getOpcode(), AMDGPU::OpName::imm))
445 return;
446
447 // Check for additional literals
448 for (unsigned i = 0, e = Desc.getNumOperands(); i < e; ++i) {
449
450 // Check if this operand should be encoded as [SV]Src
452 continue;
453
454 // Is this operand a literal immediate?
455 const MCOperand &Op = MI.getOperand(i);
456 auto Enc = getLitEncoding(Desc, Op, i, STI);
457 if (!Enc || (*Enc != 255 && *Enc != 254))
458 continue;
459
460 // Yes! Encode it
461 int64_t Imm = 0;
462
463 bool IsLit = false;
464 if (Op.isImm())
465 Imm = Op.getImm();
466 else if (Op.isExpr()) {
467 if (const auto *C = dyn_cast<MCConstantExpr>(Op.getExpr())) {
468 Imm = C->getValue();
469 } else if (AMDGPU::isLitExpr(Op.getExpr())) {
470 IsLit = true;
471 Imm = AMDGPU::getLitValue(Op.getExpr());
472 }
473 } else // Exprs will be replaced with a fixup value.
474 llvm_unreachable("Must be immediate or expr");
475
476 if (*Enc == 254) {
477 assert(STI.hasFeature(AMDGPU::Feature64BitLiterals));
479 } else {
480 auto OpType =
481 static_cast<AMDGPU::OperandType>(Desc.operands()[i].OperandType);
482 Imm = AMDGPU::encode32BitLiteral(Imm, OpType, IsLit);
484 }
485
486 // Only one literal value allowed
487 break;
488 }
489}
490
491void AMDGPUMCCodeEmitter::getSOPPBrEncoding(const MCInst &MI, unsigned OpNo,
492 APInt &Op,
493 SmallVectorImpl<MCFixup> &Fixups,
494 const MCSubtargetInfo &STI) const {
495 const MCOperand &MO = MI.getOperand(OpNo);
496
497 if (MO.isExpr()) {
498 const MCExpr *Expr = MO.getExpr();
499 addFixup(Fixups, 0, Expr, AMDGPU::fixup_si_sopp_br, true);
500 Op = APInt::getZero(96);
501 } else {
502 getMachineOpValue(MI, MO, Op, Fixups, STI);
503 }
504}
505
506void AMDGPUMCCodeEmitter::getSMEMOffsetEncoding(
507 const MCInst &MI, unsigned OpNo, APInt &Op,
508 SmallVectorImpl<MCFixup> &Fixups, const MCSubtargetInfo &STI) const {
509 auto Offset = MI.getOperand(OpNo).getImm();
510 // VI only supports 20-bit unsigned offsets.
512 Op = Offset;
513}
514
515void AMDGPUMCCodeEmitter::getSDWASrcEncoding(const MCInst &MI, unsigned OpNo,
516 APInt &Op,
517 SmallVectorImpl<MCFixup> &Fixups,
518 const MCSubtargetInfo &STI) const {
519 using namespace AMDGPU::SDWA;
520
521 uint64_t RegEnc = 0;
522
523 const MCOperand &MO = MI.getOperand(OpNo);
524
525 if (MO.isReg()) {
526 MCRegister Reg = MO.getReg();
527 RegEnc |= MRI.getEncodingValue(Reg);
528 RegEnc &= SDWA9EncValues::SRC_VGPR_MASK;
530 RegEnc |= SDWA9EncValues::SRC_SGPR_MASK;
531 }
532 Op = RegEnc;
533 return;
534 } else {
535 const MCInstrDesc &Desc = MCII.get(MI.getOpcode());
536 auto Enc = getLitEncoding(Desc, MO, OpNo, STI);
537 if (Enc && *Enc != 255) {
538 Op = *Enc | SDWA9EncValues::SRC_SGPR_MASK;
539 return;
540 }
541 }
542
543 llvm_unreachable("Unsupported operand kind");
544}
545
546void AMDGPUMCCodeEmitter::getSDWAVopcDstEncoding(
547 const MCInst &MI, unsigned OpNo, APInt &Op,
548 SmallVectorImpl<MCFixup> &Fixups, const MCSubtargetInfo &STI) const {
549 using namespace AMDGPU::SDWA;
550
551 uint64_t RegEnc = 0;
552
553 const MCOperand &MO = MI.getOperand(OpNo);
554
555 MCRegister Reg = MO.getReg();
556 if (Reg != AMDGPU::VCC && Reg != AMDGPU::VCC_LO) {
557 RegEnc |= MRI.getEncodingValue(Reg);
558 RegEnc &= SDWA9EncValues::VOPC_DST_SGPR_MASK;
559 RegEnc |= SDWA9EncValues::VOPC_DST_VCC_MASK;
560 }
561 Op = RegEnc;
562}
563
564void AMDGPUMCCodeEmitter::getAVOperandEncoding(
565 const MCInst &MI, unsigned OpNo, APInt &Op,
566 SmallVectorImpl<MCFixup> &Fixups, const MCSubtargetInfo &STI) const {
567 MCRegister Reg = MI.getOperand(OpNo).getReg();
568 unsigned Enc = MRI.getEncodingValue(Reg);
569 unsigned Idx = Enc & AMDGPU::HWEncoding::LO256_REG_IDX_MASK;
570 bool IsVGPROrAGPR =
572
573 // VGPR and AGPR have the same encoding, but SrcA and SrcB operands of mfma
574 // instructions use acc[0:1] modifier bits to distinguish. These bits are
575 // encoded as a virtual 9th bit of the register for these operands.
576 bool IsAGPR = Enc & AMDGPU::HWEncoding::IS_AGPR;
577
578 Op = Idx | (IsVGPROrAGPR << 8) | (IsAGPR << 9);
579}
580
581static bool needsPCRel(const MCExpr *Expr) {
582 switch (Expr->getKind()) {
583 case MCExpr::SymbolRef: {
584 auto *SE = cast<MCSymbolRefExpr>(Expr);
585 auto Spec = AMDGPU::getSpecifier(SE);
586 return Spec != AMDGPUMCExpr::S_ABS32_LO &&
588 }
589 case MCExpr::Binary: {
590 auto *BE = cast<MCBinaryExpr>(Expr);
591 if (BE->getOpcode() == MCBinaryExpr::Sub)
592 return false;
593 return needsPCRel(BE->getLHS()) || needsPCRel(BE->getRHS());
594 }
595 case MCExpr::Unary:
596 return needsPCRel(cast<MCUnaryExpr>(Expr)->getSubExpr());
598 case MCExpr::Target:
599 case MCExpr::Constant:
600 return false;
601 }
602 llvm_unreachable("invalid kind");
603}
604
605void AMDGPUMCCodeEmitter::getMachineOpValue(const MCInst &MI,
606 const MCOperand &MO, APInt &Op,
607 SmallVectorImpl<MCFixup> &Fixups,
608 const MCSubtargetInfo &STI) const {
609 if (MO.isReg()){
610 unsigned Enc = MRI.getEncodingValue(MO.getReg());
611 unsigned Idx = Enc & AMDGPU::HWEncoding::LO256_REG_IDX_MASK;
612 bool IsVGPROrAGPR =
614 Op = Idx | (IsVGPROrAGPR << 8);
615 return;
616 }
617 unsigned OpNo = &MO - MI.begin();
618 getMachineOpValueCommon(MI, MO, OpNo, Op, Fixups, STI);
619}
620
621void AMDGPUMCCodeEmitter::getMachineOpValueT16(
622 const MCInst &MI, unsigned OpNo, APInt &Op,
623 SmallVectorImpl<MCFixup> &Fixups, const MCSubtargetInfo &STI) const {
624 const MCOperand &MO = MI.getOperand(OpNo);
625 if (MO.isReg()) {
626 unsigned Enc = MRI.getEncodingValue(MO.getReg());
627 unsigned Idx = Enc & AMDGPU::HWEncoding::REG_IDX_MASK;
628 bool IsVGPR = Enc & AMDGPU::HWEncoding::IS_VGPR;
629 Op = Idx | (IsVGPR << 8);
630 return;
631 }
632 getMachineOpValueCommon(MI, MO, OpNo, Op, Fixups, STI);
633 // VGPRs include the suffix/op_sel bit in the register encoding, but
634 // immediates and SGPRs include it in src_modifiers. Therefore, copy the
635 // op_sel bit from the src operands into src_modifier operands if Op is
636 // src_modifiers and the corresponding src is a VGPR
637 int SrcMOIdx = -1;
638 assert(OpNo < INT_MAX);
639 if ((int)OpNo == AMDGPU::getNamedOperandIdx(MI.getOpcode(),
640 AMDGPU::OpName::src0_modifiers)) {
641 SrcMOIdx = AMDGPU::getNamedOperandIdx(MI.getOpcode(), AMDGPU::OpName::src0);
642 int VDstMOIdx =
643 AMDGPU::getNamedOperandIdx(MI.getOpcode(), AMDGPU::OpName::vdst);
644 if (VDstMOIdx != -1) {
645 auto DstReg = MI.getOperand(VDstMOIdx).getReg();
646 if (AMDGPU::isHi16Reg(DstReg, MRI))
648 }
649 } else if ((int)OpNo == AMDGPU::getNamedOperandIdx(
650 MI.getOpcode(), AMDGPU::OpName::src1_modifiers))
651 SrcMOIdx = AMDGPU::getNamedOperandIdx(MI.getOpcode(), AMDGPU::OpName::src1);
652 else if ((int)OpNo == AMDGPU::getNamedOperandIdx(
653 MI.getOpcode(), AMDGPU::OpName::src2_modifiers))
654 SrcMOIdx = AMDGPU::getNamedOperandIdx(MI.getOpcode(), AMDGPU::OpName::src2);
655 if (SrcMOIdx == -1)
656 return;
657
658 const MCOperand &SrcMO = MI.getOperand(SrcMOIdx);
659 if (!SrcMO.isReg())
660 return;
661 auto SrcReg = SrcMO.getReg();
662 if (AMDGPU::isSGPR(SrcReg, &MRI))
663 return;
664 if (AMDGPU::isHi16Reg(SrcReg, MRI))
666}
667
668void AMDGPUMCCodeEmitter::getMachineOpValueT16Lo128(
669 const MCInst &MI, unsigned OpNo, APInt &Op,
670 SmallVectorImpl<MCFixup> &Fixups, const MCSubtargetInfo &STI) const {
671 const MCOperand &MO = MI.getOperand(OpNo);
672 if (MO.isReg()) {
673 uint16_t Encoding = MRI.getEncodingValue(MO.getReg());
674 unsigned RegIdx = Encoding & AMDGPU::HWEncoding::LO256_REG_IDX_MASK;
675 bool IsHi = Encoding & AMDGPU::HWEncoding::IS_HI16;
676 bool IsVGPR = Encoding & AMDGPU::HWEncoding::IS_VGPR;
677 assert((!IsVGPR || isUInt<7>(RegIdx)) && "VGPR0-VGPR127 expected!");
678 Op = (IsVGPR ? 0x100 : 0) | (IsHi ? 0x80 : 0) | RegIdx;
679 return;
680 }
681 getMachineOpValueCommon(MI, MO, OpNo, Op, Fixups, STI);
682}
683
684void AMDGPUMCCodeEmitter::getMachineOpValueCommon(
685 const MCInst &MI, const MCOperand &MO, unsigned OpNo, APInt &Op,
686 SmallVectorImpl<MCFixup> &Fixups, const MCSubtargetInfo &STI) const {
687 bool isLikeImm = false;
688 int64_t Val;
689
690 if (MO.isImm()) {
691 Val = MO.getImm();
692 isLikeImm = true;
693 } else if (MO.isExpr() && MO.getExpr()->evaluateAsAbsolute(Val)) {
694 isLikeImm = true;
695 } else if (MO.isExpr()) {
696 // FIXME: If this is expression is PCRel or not should not depend on what
697 // the expression looks like. Given that this is just a general expression,
698 // it should probably be FK_Data_4 and whatever is producing
699 //
700 // s_add_u32 s2, s2, (extern_const_addrspace+16
701 //
702 // And expecting a PCRel should instead produce
703 //
704 // .Ltmp1:
705 // s_add_u32 s2, s2, (extern_const_addrspace+16)-.Ltmp1
706 bool PCRel = needsPCRel(MO.getExpr());
707 const MCInstrDesc &Desc = MCII.get(MI.getOpcode());
708 uint32_t Offset = Desc.getSize();
709 assert(Offset == 4 || Offset == 8);
710 unsigned Size = AMDGPU::getOperandSize(Desc, OpNo);
712 addFixup(Fixups, Offset, MO.getExpr(), Kind, PCRel);
713 }
714
715 const MCInstrDesc &Desc = MCII.get(MI.getOpcode());
716 if (AMDGPU::isSISrcOperand(Desc, OpNo)) {
717 bool HasMandatoryLiteral =
718 AMDGPU::hasNamedOperand(MI.getOpcode(), AMDGPU::OpName::imm);
719 if (auto Enc = getLitEncoding(Desc, MO, OpNo, STI, HasMandatoryLiteral)) {
720 Op = *Enc;
721 return;
722 }
723
724 llvm_unreachable("Operand not supported for SISrc");
725 }
726
727 if (isLikeImm) {
728 Op = Val;
729 return;
730 }
731
732 llvm_unreachable("Encoding of this operand type is not supported yet.");
733}
734
735template <bool HasSrc0, bool HasSrc1, bool HasSrc2>
736APInt AMDGPUMCCodeEmitter::postEncodeVOP3(const MCInst &MI, APInt EncodedValue,
737 const MCSubtargetInfo &STI) const {
738 if (!AMDGPU::isGFX10Plus(STI))
739 return EncodedValue;
740 // Set unused source fields in VOP3 encodings to inline immediate 0 to avoid
741 // hardware conservatively assuming the instruction reads SGPRs.
742 constexpr uint64_t InlineImmediate0 = 0x80;
743 if (!HasSrc0)
744 EncodedValue |= InlineImmediate0 << 32;
745 if (!HasSrc1)
746 EncodedValue |= InlineImmediate0 << 41;
747 if (!HasSrc2)
748 EncodedValue |= InlineImmediate0 << 50;
749 return EncodedValue;
750}
751
752APInt AMDGPUMCCodeEmitter::postEncodeVOPCX(const MCInst &MI, APInt EncodedValue,
753 const MCSubtargetInfo &STI) const {
754 // GFX10+ v_cmpx opcodes promoted to VOP3 have implied dst=EXEC.
755 // Documentation requires dst to be encoded as EXEC (0x7E),
756 // but it looks like the actual value encoded for dst operand
757 // is ignored by HW. It was decided to define dst as "do not care"
758 // in td files to allow disassembler accept any dst value.
759 // However, dst is encoded as EXEC for compatibility with SP3.
760 [[maybe_unused]] const MCInstrDesc &Desc = MCII.get(MI.getOpcode());
761 assert((Desc.TSFlags & SIInstrFlags::VOP3) &&
762 Desc.hasImplicitDefOfPhysReg(AMDGPU::EXEC));
763 EncodedValue |= MRI.getEncodingValue(AMDGPU::EXEC_LO) &
765 return postEncodeVOP3<true, true, false>(MI, EncodedValue, STI);
766}
767
768#include "AMDGPUGenMCCodeEmitter.inc"
static void addFixup(SmallVectorImpl< MCFixup > &Fixups, uint32_t Offset, const MCExpr *Value, uint16_t Kind, bool PCRel=false)
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
static uint32_t getLit64Encoding(const MCInstrDesc &Desc, uint64_t Val, const MCSubtargetInfo &STI, bool IsFP)
static uint32_t getLit16IntEncoding(uint32_t Val, const MCSubtargetInfo &STI)
static void addFixup(SmallVectorImpl< MCFixup > &Fixups, uint32_t Offset, const MCExpr *Value, uint16_t Kind, bool PCRel=false)
static uint32_t getLitBF16Encoding(uint16_t Val)
static uint32_t getLit16Encoding(uint16_t Val, const MCSubtargetInfo &STI)
static uint32_t getIntInlineImmEncoding(IntTy Imm)
static bool needsPCRel(const MCExpr *Expr)
static uint32_t getLit32Encoding(uint32_t Val, const MCSubtargetInfo &STI)
Provides AMDGPU specific target descriptions.
This file implements a class to represent arbitrary precision integral constant values and operations...
IRTranslator LLVM IR MI
Register Reg
LLVM_ABI uint64_t extractBitsAsZExtValue(unsigned numBits, unsigned bitPosition) const
Definition APInt.cpp:521
uint64_t getLimitedValue(uint64_t Limit=UINT64_MAX) const
If this value is smaller than the specified limit, return it, otherwise return the limit value.
Definition APInt.h:476
static APInt getZero(unsigned numBits)
Get the '0' value for the specified bit-width.
Definition APInt.h:201
@ Sub
Subtraction.
Definition MCExpr.h:324
MCCodeEmitter - Generic instruction encoding interface.
Context object for machine code objects.
Definition MCContext.h:83
Base class for the full range of assembler expressions which are needed for parsing.
Definition MCExpr.h:34
@ Unary
Unary expressions.
Definition MCExpr.h:44
@ Constant
Constant expressions.
Definition MCExpr.h:42
@ SymbolRef
References to labels and assigned expressions.
Definition MCExpr.h:43
@ Target
Target specific expression.
Definition MCExpr.h:46
@ Specifier
Expression with a relocation specifier.
Definition MCExpr.h:45
@ Binary
Binary expressions.
Definition MCExpr.h:41
ExprKind getKind() const
Definition MCExpr.h:85
static MCFixupKind getDataKindForSize(unsigned Size)
Return the generic fixup kind for a value with the given size.
Definition MCFixup.h:110
static MCFixup create(uint32_t Offset, const MCExpr *Value, MCFixupKind Kind, bool PCRel=false)
Consider bit fields if we need more flags.
Definition MCFixup.h:86
Describe properties that are true of each instruction in the target description file.
Interface to description of machine instruction set.
Definition MCInstrInfo.h:27
const MCInstrDesc & get(unsigned Opcode) const
Return the machine instruction descriptor that corresponds to the specified instruction opcode.
Definition MCInstrInfo.h:90
uint8_t OperandType
Information about the type of the operand.
Definition MCInstrDesc.h:98
Instances of this class represent operands of the MCInst class.
Definition MCInst.h:40
int64_t getImm() const
Definition MCInst.h:84
bool isImm() const
Definition MCInst.h:66
bool isReg() const
Definition MCInst.h:65
MCRegister getReg() const
Returns the register number.
Definition MCInst.h:73
bool isDFPImm() const
Definition MCInst.h:68
const MCExpr * getExpr() const
Definition MCInst.h:118
bool isExpr() const
Definition MCInst.h:69
uint16_t getEncodingValue(MCRegister Reg) const
Returns the encoding for Reg.
Generic base class for all target subtargets.
bool hasFeature(unsigned Feature) const
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
void append(ItTy in_start, ItTy in_end)
Add the specified range to the end of the SmallVector.
void push_back(const T &Elt)
LLVM Value Representation.
Definition Value.h:75
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
bool isSGPR(MCRegister Reg, const MCRegisterInfo *TRI)
Is Reg - scalar register.
bool isHi16Reg(MCRegister Reg, const MCRegisterInfo &MRI)
static AMDGPUMCExpr::Specifier getSpecifier(const MCSymbolRefExpr *SRE)
LLVM_READONLY bool isLitExpr(const MCExpr *Expr)
@ fixup_si_sopp_br
16-bit PC relative fixup for SOPP branch instructions.
LLVM_READONLY bool hasNamedOperand(uint64_t Opcode, OpName NamedIdx)
constexpr bool isSISrcOperand(const MCOperandInfo &OpInfo)
Is this an AMDGPU specific source operand?
LLVM_READONLY AMDGPUMCExpr::VariantKind getExprKind(const MCExpr *Expr)
LLVM_READONLY int64_t getLitValue(const MCExpr *Expr)
bool isGFX11Plus(const MCSubtargetInfo &STI)
std::optional< unsigned > getInlineEncodingV2F16(uint32_t Literal)
bool isGFX10Plus(const MCSubtargetInfo &STI)
int64_t encode32BitLiteral(int64_t Imm, OperandType Type, bool IsLit)
@ OPERAND_KIMM32
Operand with 32-bit immediate that uses the constant bus.
Definition SIDefines.h:234
@ OPERAND_REG_IMM_INT64
Definition SIDefines.h:204
@ OPERAND_REG_IMM_V2FP16
Definition SIDefines.h:211
@ OPERAND_REG_INLINE_C_FP64
Definition SIDefines.h:225
@ OPERAND_REG_INLINE_C_BF16
Definition SIDefines.h:222
@ OPERAND_REG_INLINE_C_V2BF16
Definition SIDefines.h:227
@ OPERAND_REG_IMM_V2INT16
Definition SIDefines.h:213
@ OPERAND_REG_IMM_BF16
Definition SIDefines.h:208
@ OPERAND_REG_IMM_INT32
Operands with register, 32-bit, or 64-bit immediate.
Definition SIDefines.h:203
@ OPERAND_REG_IMM_V2BF16
Definition SIDefines.h:210
@ OPERAND_REG_IMM_FP16
Definition SIDefines.h:209
@ OPERAND_REG_IMM_V2FP16_SPLAT
Definition SIDefines.h:212
@ OPERAND_REG_INLINE_C_INT64
Definition SIDefines.h:221
@ OPERAND_REG_INLINE_C_INT16
Operands with register or inline constant.
Definition SIDefines.h:219
@ OPERAND_REG_IMM_NOINLINE_V2FP16
Definition SIDefines.h:214
@ OPERAND_REG_IMM_FP64
Definition SIDefines.h:207
@ OPERAND_REG_INLINE_C_V2FP16
Definition SIDefines.h:228
@ OPERAND_REG_INLINE_AC_INT32
Operands with an AccVGPR register or inline constant.
Definition SIDefines.h:239
@ OPERAND_REG_INLINE_AC_FP32
Definition SIDefines.h:240
@ OPERAND_REG_IMM_V2INT32
Definition SIDefines.h:215
@ OPERAND_REG_IMM_FP32
Definition SIDefines.h:206
@ OPERAND_REG_INLINE_C_FP32
Definition SIDefines.h:224
@ OPERAND_REG_INLINE_C_INT32
Definition SIDefines.h:220
@ OPERAND_REG_INLINE_C_V2INT16
Definition SIDefines.h:226
@ OPERAND_REG_IMM_V2FP32
Definition SIDefines.h:216
@ OPERAND_REG_INLINE_AC_FP64
Definition SIDefines.h:241
@ OPERAND_REG_INLINE_C_FP16
Definition SIDefines.h:223
@ OPERAND_REG_IMM_INT16
Definition SIDefines.h:205
@ OPERAND_INLINE_SPLIT_BARRIER_INT32
Definition SIDefines.h:231
std::optional< unsigned > getPKFMACF16InlineEncoding(uint32_t Literal, bool IsGFX11Plus)
std::optional< unsigned > getInlineEncodingV2I16(uint32_t Literal)
bool isVI(const MCSubtargetInfo &STI)
MCRegister mc2PseudoReg(MCRegister Reg)
Convert hardware register Reg to a pseudo register.
std::optional< unsigned > getInlineEncodingV2BF16(uint32_t Literal)
LLVM_READNONE unsigned getOperandSize(const MCOperandInfo &OpInfo)
@ C
The default llvm calling convention, compatible with C.
Definition CallingConv.h:34
void write(void *memory, value_type value, endianness endian)
Write a value to memory with a particular endianness.
Definition Endian.h:96
This is an optimization pass for GlobalISel generic memory operations.
@ Offset
Definition DWP.cpp:557
constexpr bool isInt(int64_t x)
Checks if an integer fits into the given bit width.
Definition MathExtras.h:165
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:643
Op::Description Desc
uint16_t MCFixupKind
Extensible enumeration to represent the type of a fixup.
Definition MCFixup.h:22
constexpr bool isUInt(uint64_t x)
Checks if an unsigned integer fits into the given bit width.
Definition MathExtras.h:189
constexpr uint32_t Lo_32(uint64_t Value)
Return the low 32 bits of a 64 bit value.
Definition MathExtras.h:155
To bit_cast(const From &from) noexcept
Definition bit.h:90
DWARFExpression::Operation Op
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:559
MCCodeEmitter * createAMDGPUMCCodeEmitter(const MCInstrInfo &MCII, MCContext &Ctx)