1//=- LoongArchISelLowering.cpp - LoongArch DAG Lowering Implementation ---===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This file defines the interfaces that LoongArch uses to lower LLVM code into
10// a selection DAG.
11//
12//===----------------------------------------------------------------------===//
13
15#include "LoongArch.h"
18#include "LoongArchSubtarget.h"
22#include "llvm/ADT/SmallSet.h"
23#include "llvm/ADT/Statistic.h"
29#include "llvm/IR/IRBuilder.h"
31#include "llvm/IR/IntrinsicsLoongArch.h"
33#include "llvm/Support/Debug.h"
38
39using namespace llvm;
40
41#define DEBUG_TYPE "loongarch-isel-lowering"
42
43STATISTIC(NumTailCalls, "Number of tail calls");
44
53
55 "loongarch-materialize-float-imm", cl::Hidden,
56 cl::desc("Maximum number of instructions used (including code sequence "
57 "to generate the value and moving the value to FPR) when "
58 "materializing floating-point immediates (default = 3)"),
60 cl::values(clEnumValN(NoMaterializeFPImm, "0", "Use constant pool"),
62 "Materialize FP immediate within 2 instructions"),
64 "Materialize FP immediate within 3 instructions"),
66 "Materialize FP immediate within 4 instructions"),
68 "Materialize FP immediate within 5 instructions"),
70 "Materialize FP immediate within 6 instructions "
71 "(behaves same as 5 on loongarch64)")));
72
73static cl::opt<bool> ZeroDivCheck("loongarch-check-zero-division", cl::Hidden,
74 cl::desc("Trap on integer division by zero."),
75 cl::init(false));
76
78 const LoongArchSubtarget &STI)
79 : TargetLowering(TM), Subtarget(STI) {
80
81 MVT GRLenVT = Subtarget.getGRLenVT();
82
83 // Set up the register classes.
84
85 addRegisterClass(GRLenVT, &LoongArch::GPRRegClass);
86 if (Subtarget.hasBasicF())
87 addRegisterClass(MVT::f32, &LoongArch::FPR32RegClass);
88 if (Subtarget.hasBasicD())
89 addRegisterClass(MVT::f64, &LoongArch::FPR64RegClass);
90
91 static const MVT::SimpleValueType LSXVTs[] = {
92 MVT::v16i8, MVT::v8i16, MVT::v4i32, MVT::v2i64, MVT::v4f32, MVT::v2f64};
93 static const MVT::SimpleValueType LASXVTs[] = {
94 MVT::v32i8, MVT::v16i16, MVT::v8i32, MVT::v4i64, MVT::v8f32, MVT::v4f64};
95
96 if (Subtarget.hasExtLSX())
97 for (MVT VT : LSXVTs)
98 addRegisterClass(VT, &LoongArch::LSX128RegClass);
99
100 if (Subtarget.hasExtLASX())
101 for (MVT VT : LASXVTs)
102 addRegisterClass(VT, &LoongArch::LASX256RegClass);
103
104 // Set operations for LA32 and LA64.
105
107 MVT::i1, Promote);
108
115
118 GRLenVT, Custom);
119
121
122 setOperationAction(ISD::DYNAMIC_STACKALLOC, GRLenVT, Expand);
123 setOperationAction({ISD::STACKSAVE, ISD::STACKRESTORE}, MVT::Other, Expand);
124 setOperationAction(ISD::VASTART, MVT::Other, Custom);
125 setOperationAction({ISD::VAARG, ISD::VACOPY, ISD::VAEND}, MVT::Other, Expand);
126
127 setOperationAction(ISD::DEBUGTRAP, MVT::Other, Legal);
128 setOperationAction(ISD::TRAP, MVT::Other, Legal);
129
133
134 setOperationAction(ISD::PREFETCH, MVT::Other, Custom);
135
136 // BITREV/REVB requires the 32S feature.
137 if (STI.has32S()) {
138 // Expand bitreverse.i16 with native-width bitrev and shift for now, until
139 // we know which of sll and revb.2h is faster.
142
143 // LA32 does not have REVB.2W and REVB.D due to the 64-bit operands, and
144 // the narrower REVB.W does not exist. But LA32 does have REVB.2H, so i16
145 // and i32 could still be byte-swapped relatively cheaply.
147 } else {
155 }
156
157 setOperationAction(ISD::BR_JT, MVT::Other, Expand);
158 setOperationAction(ISD::BR_CC, GRLenVT, Expand);
159 setOperationAction(ISD::BRCOND, MVT::Other, Custom);
163
166
167 // Set operations for LA64 only.
168
169 if (Subtarget.is64Bit()) {
176 setOperationAction(ISD::BITCAST, MVT::i32, Custom);
187
191 Custom);
192 setOperationAction(ISD::LROUND, MVT::i32, Custom);
193 }
194
195 // Set operations for LA32 only.
196
197 if (!Subtarget.is64Bit()) {
203 if (Subtarget.hasBasicD())
204 setOperationAction(ISD::BITCAST, MVT::i64, Custom);
205 }
206
207 setOperationAction(ISD::ATOMIC_FENCE, MVT::Other, Custom);
208
209 static const ISD::CondCode FPCCToExpand[] = {
212
213 // Set operations for 'F' feature.
214
215 if (Subtarget.hasBasicF()) {
216 setLoadExtAction(ISD::EXTLOAD, MVT::f32, MVT::f16, Expand);
217 setTruncStoreAction(MVT::f32, MVT::f16, Expand);
218 setLoadExtAction(ISD::EXTLOAD, MVT::f32, MVT::bf16, Expand);
219 setTruncStoreAction(MVT::f32, MVT::bf16, Expand);
220 setCondCodeAction(FPCCToExpand, MVT::f32, Expand);
221
224 setOperationAction(ISD::BR_CC, MVT::f32, Expand);
226 setOperationAction(ISD::FMINNUM_IEEE, MVT::f32, Legal);
227 setOperationAction(ISD::FMINNUM, MVT::f32, Legal);
228 setOperationAction(ISD::FMAXNUM_IEEE, MVT::f32, Legal);
229 setOperationAction(ISD::FMAXNUM, MVT::f32, Legal);
234 setOperationAction(ISD::FSIN, MVT::f32, Expand);
235 setOperationAction(ISD::FCOS, MVT::f32, Expand);
236 setOperationAction(ISD::FSINCOS, MVT::f32, Expand);
237 setOperationAction(ISD::FPOW, MVT::f32, Expand);
239 setOperationAction(ISD::FP16_TO_FP, MVT::f32,
240 Subtarget.isSoftFPABI() ? LibCall : Custom);
241 setOperationAction(ISD::FP_TO_FP16, MVT::f32,
242 Subtarget.isSoftFPABI() ? LibCall : Custom);
243 setOperationAction(ISD::BF16_TO_FP, MVT::f32, Custom);
244 setOperationAction(ISD::FP_TO_BF16, MVT::f32,
245 Subtarget.isSoftFPABI() ? LibCall : Custom);
246
247 if (Subtarget.is64Bit()) {
248 setOperationAction(ISD::FRINT, MVT::f32, Legal);
249 setOperationAction(ISD::FLOG2, MVT::f32, Legal);
250 }
251
252 if (!Subtarget.hasBasicD()) {
254 if (Subtarget.is64Bit()) {
257 }
258 }
259 }
260
261 // Set operations for 'D' feature.
262
263 if (Subtarget.hasBasicD()) {
264 setLoadExtAction(ISD::EXTLOAD, MVT::f64, MVT::f16, Expand);
265 setLoadExtAction(ISD::EXTLOAD, MVT::f64, MVT::f32, Expand);
266 setLoadExtAction(ISD::EXTLOAD, MVT::f64, MVT::bf16, Expand);
267 setTruncStoreAction(MVT::f64, MVT::bf16, Expand);
268 setTruncStoreAction(MVT::f64, MVT::f16, Expand);
269 setTruncStoreAction(MVT::f64, MVT::f32, Expand);
270 setCondCodeAction(FPCCToExpand, MVT::f64, Expand);
271
274 setOperationAction(ISD::BR_CC, MVT::f64, Expand);
278 setOperationAction(ISD::FMINNUM_IEEE, MVT::f64, Legal);
279 setOperationAction(ISD::FMINNUM, MVT::f64, Legal);
280 setOperationAction(ISD::FMAXNUM_IEEE, MVT::f64, Legal);
282 setOperationAction(ISD::FMAXNUM, MVT::f64, Legal);
284 setOperationAction(ISD::FSIN, MVT::f64, Expand);
285 setOperationAction(ISD::FCOS, MVT::f64, Expand);
286 setOperationAction(ISD::FSINCOS, MVT::f64, Expand);
287 setOperationAction(ISD::FPOW, MVT::f64, Expand);
289 setOperationAction(ISD::FP16_TO_FP, MVT::f64, Expand);
290 setOperationAction(ISD::FP_TO_FP16, MVT::f64,
291 Subtarget.isSoftFPABI() ? LibCall : Custom);
292 setOperationAction(ISD::BF16_TO_FP, MVT::f64, Custom);
293 setOperationAction(ISD::FP_TO_BF16, MVT::f64,
294 Subtarget.isSoftFPABI() ? LibCall : Custom);
295
296 if (Subtarget.is64Bit()) {
297 setOperationAction(ISD::FRINT, MVT::f64, Legal);
298 setOperationAction(ISD::FLOG2, MVT::f64, Legal);
299 }
300 }
301
302 // Set operations for 'LSX' feature.
303
304 if (Subtarget.hasExtLSX()) {
306 // Expand all truncating stores and extending loads.
307 for (MVT InnerVT : MVT::fixedlen_vector_valuetypes()) {
308 setTruncStoreAction(VT, InnerVT, Expand);
311 setLoadExtAction(ISD::EXTLOAD, VT, InnerVT, Expand);
312 }
313 // By default everything must be expanded. Then we will selectively turn
314 // on ones that can be effectively codegen'd.
315 for (unsigned Op = 0; Op < ISD::BUILTIN_OP_END; ++Op)
317 }
318
319 for (MVT VT : LSXVTs) {
320 setOperationAction({ISD::LOAD, ISD::STORE}, VT, Legal);
321 setOperationAction(ISD::BITCAST, VT, Legal);
323
327
332 }
333 for (MVT VT : {MVT::v16i8, MVT::v8i16, MVT::v4i32, MVT::v2i64}) {
336 Legal);
338 VT, Legal);
345 Expand);
354 }
355 for (MVT VT : {MVT::v16i8, MVT::v8i16, MVT::v4i32})
357 for (MVT VT : {MVT::v8i16, MVT::v4i32, MVT::v2i64})
359 for (MVT VT : {MVT::v4i32, MVT::v2i64}) {
362 }
363 for (MVT VT : {MVT::v4f32, MVT::v2f64}) {
367 setOperationAction(ISD::FSQRT, VT, Legal);
368 setOperationAction(ISD::FNEG, VT, Legal);
369 setOperationAction(ISD::FLOG2, VT, Legal);
372 VT, Expand);
374 setOperationAction(ISD::FCEIL, VT, Legal);
375 setOperationAction(ISD::FFLOOR, VT, Legal);
376 setOperationAction(ISD::FTRUNC, VT, Legal);
377 setOperationAction(ISD::FROUNDEVEN, VT, Legal);
378 setOperationAction(ISD::FMINNUM, VT, Legal);
379 setOperationAction(ISD::FMAXNUM, VT, Legal);
380 }
382 setOperationAction(ISD::FCEIL, {MVT::f32, MVT::f64}, Legal);
383 setOperationAction(ISD::FFLOOR, {MVT::f32, MVT::f64}, Legal);
384 setOperationAction(ISD::FTRUNC, {MVT::f32, MVT::f64}, Legal);
385 setOperationAction(ISD::FROUNDEVEN, {MVT::f32, MVT::f64}, Legal);
386
387 for (MVT VT :
388 {MVT::v16i8, MVT::v8i8, MVT::v4i8, MVT::v2i8, MVT::v8i16, MVT::v4i16,
389 MVT::v2i16, MVT::v4i32, MVT::v2i32, MVT::v2i64}) {
391 setOperationAction(ISD::VECREDUCE_ADD, VT, Custom);
392 setOperationAction(ISD::VECREDUCE_AND, VT, Custom);
393 setOperationAction(ISD::VECREDUCE_OR, VT, Custom);
394 setOperationAction(ISD::VECREDUCE_XOR, VT, Custom);
395 setOperationAction(ISD::VECREDUCE_SMAX, VT, Custom);
396 setOperationAction(ISD::VECREDUCE_SMIN, VT, Custom);
397 setOperationAction(ISD::VECREDUCE_UMAX, VT, Custom);
398 setOperationAction(ISD::VECREDUCE_UMIN, VT, Custom);
399 }
400 }
401
402 // Set operations for 'LASX' feature.
403
404 if (Subtarget.hasExtLASX()) {
405 for (MVT VT : LASXVTs) {
406 setOperationAction({ISD::LOAD, ISD::STORE}, VT, Legal);
407 setOperationAction(ISD::BITCAST, VT, Legal);
409
415
419 }
420 for (MVT VT : {MVT::v4i64, MVT::v8i32, MVT::v16i16, MVT::v32i8}) {
423 Legal);
425 VT, Legal);
432 Expand);
441 setOperationAction(ISD::VECREDUCE_ADD, VT, Custom);
442 }
443 for (MVT VT : {MVT::v32i8, MVT::v16i16, MVT::v8i32})
445 for (MVT VT : {MVT::v16i16, MVT::v8i32, MVT::v4i64})
447 for (MVT VT : {MVT::v8i32, MVT::v4i32, MVT::v4i64}) {
450 }
451 for (MVT VT : {MVT::v8f32, MVT::v4f64}) {
455 setOperationAction(ISD::FSQRT, VT, Legal);
456 setOperationAction(ISD::FNEG, VT, Legal);
457 setOperationAction(ISD::FLOG2, VT, Legal);
460 VT, Expand);
462 setOperationAction(ISD::FCEIL, VT, Legal);
463 setOperationAction(ISD::FFLOOR, VT, Legal);
464 setOperationAction(ISD::FTRUNC, VT, Legal);
465 setOperationAction(ISD::FROUNDEVEN, VT, Legal);
466 setOperationAction(ISD::FMINNUM, VT, Legal);
467 setOperationAction(ISD::FMAXNUM, VT, Legal);
468 }
469 }
470
471 // Set DAG combine for LA32 and LA64.
472
477
478 // Set DAG combine for 'LSX' feature.
479
480 if (Subtarget.hasExtLSX()) {
482 setTargetDAGCombine(ISD::BITCAST);
483 }
484
485 // Set DAG combine for 'LASX' feature.
486
487 if (Subtarget.hasExtLASX())
489
490 // Compute derived properties from the register classes.
491 computeRegisterProperties(Subtarget.getRegisterInfo());
492
494
497
498 setMaxAtomicSizeInBitsSupported(Subtarget.getGRLen());
499
501
502 // Function alignments.
504 // Set preferred alignments.
505 setPrefFunctionAlignment(Subtarget.getPrefFunctionAlignment());
506 setPrefLoopAlignment(Subtarget.getPrefLoopAlignment());
507 setMaxBytesForAlignment(Subtarget.getMaxBytesForAlignment());
508
509 // cmpxchg sizes down to 8 bits become legal if LAMCAS is available.
510 if (Subtarget.hasLAMCAS())
512
513 if (Subtarget.hasSCQ()) {
515 setOperationAction(ISD::ATOMIC_CMP_SWAP, MVT::i128, Custom);
516 }
517}
518
520 const GlobalAddressSDNode *GA) const {
521 // In order to maximise the opportunity for common subexpression elimination,
522 // keep a separate ADD node for the global address offset instead of folding
523 // it in the global address node. Later peephole optimisations may choose to
524 // fold it back in when profitable.
525 return false;
526}
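// For example, with the offset kept as a separate ADD, accesses to (@g + 4)
// and (@g + 8) can both reuse a single node that materializes @g, whereas
// folding the offsets would produce two distinct global-address nodes and
// duplicate the address-materialization sequence.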
527
529 SelectionDAG &DAG) const {
530 switch (Op.getOpcode()) {
531 case ISD::ATOMIC_FENCE:
532 return lowerATOMIC_FENCE(Op, DAG);
534 return lowerEH_DWARF_CFA(Op, DAG);
536 return lowerGlobalAddress(Op, DAG);
538 return lowerGlobalTLSAddress(Op, DAG);
540 return lowerINTRINSIC_WO_CHAIN(Op, DAG);
542 return lowerINTRINSIC_W_CHAIN(Op, DAG);
544 return lowerINTRINSIC_VOID(Op, DAG);
546 return lowerBlockAddress(Op, DAG);
547 case ISD::JumpTable:
548 return lowerJumpTable(Op, DAG);
549 case ISD::SHL_PARTS:
550 return lowerShiftLeftParts(Op, DAG);
551 case ISD::SRA_PARTS:
552 return lowerShiftRightParts(Op, DAG, true);
553 case ISD::SRL_PARTS:
554 return lowerShiftRightParts(Op, DAG, false);
556 return lowerConstantPool(Op, DAG);
557 case ISD::FP_TO_SINT:
558 return lowerFP_TO_SINT(Op, DAG);
559 case ISD::BITCAST:
560 return lowerBITCAST(Op, DAG);
561 case ISD::UINT_TO_FP:
562 return lowerUINT_TO_FP(Op, DAG);
563 case ISD::SINT_TO_FP:
564 return lowerSINT_TO_FP(Op, DAG);
565 case ISD::VASTART:
566 return lowerVASTART(Op, DAG);
567 case ISD::FRAMEADDR:
568 return lowerFRAMEADDR(Op, DAG);
569 case ISD::RETURNADDR:
570 return lowerRETURNADDR(Op, DAG);
572 return lowerWRITE_REGISTER(Op, DAG);
574 return lowerINSERT_VECTOR_ELT(Op, DAG);
576 return lowerEXTRACT_VECTOR_ELT(Op, DAG);
578 return lowerBUILD_VECTOR(Op, DAG);
580 return lowerCONCAT_VECTORS(Op, DAG);
582 return lowerVECTOR_SHUFFLE(Op, DAG);
583 case ISD::BITREVERSE:
584 return lowerBITREVERSE(Op, DAG);
586 return lowerSCALAR_TO_VECTOR(Op, DAG);
587 case ISD::PREFETCH:
588 return lowerPREFETCH(Op, DAG);
589 case ISD::SELECT:
590 return lowerSELECT(Op, DAG);
591 case ISD::BRCOND:
592 return lowerBRCOND(Op, DAG);
593 case ISD::FP_TO_FP16:
594 return lowerFP_TO_FP16(Op, DAG);
595 case ISD::FP16_TO_FP:
596 return lowerFP16_TO_FP(Op, DAG);
597 case ISD::FP_TO_BF16:
598 return lowerFP_TO_BF16(Op, DAG);
599 case ISD::BF16_TO_FP:
600 return lowerBF16_TO_FP(Op, DAG);
601 case ISD::VECREDUCE_ADD:
602 return lowerVECREDUCE_ADD(Op, DAG);
603 case ISD::VECREDUCE_AND:
604 case ISD::VECREDUCE_OR:
605 case ISD::VECREDUCE_XOR:
606 case ISD::VECREDUCE_SMAX:
607 case ISD::VECREDUCE_SMIN:
608 case ISD::VECREDUCE_UMAX:
609 case ISD::VECREDUCE_UMIN:
610 return lowerVECREDUCE(Op, DAG);
611 case ISD::ConstantFP:
612 return lowerConstantFP(Op, DAG);
613 }
614 return SDValue();
615}
616
617SDValue LoongArchTargetLowering::lowerConstantFP(SDValue Op,
618 SelectionDAG &DAG) const {
619 EVT VT = Op.getValueType();
621 const APFloat &FPVal = CFP->getValueAPF();
622 SDLoc DL(CFP);
623
624 assert((VT == MVT::f32 && Subtarget.hasBasicF()) ||
625 (VT == MVT::f64 && Subtarget.hasBasicD()));
626
627 // If value is 0.0 or -0.0, just ignore it.
628 if (FPVal.isZero())
629 return SDValue();
630
631 // If LSX is enabled, use the cheaper 'vldi' instruction if possible.
632 if (isFPImmVLDILegal(FPVal, VT))
633 return SDValue();
634
635 // Construct the value as an integer and move it to a float register.
636 APInt INTVal = FPVal.bitcastToAPInt();
637
638 // If more than MaterializeFPImmInsNum instructions would be needed to
639 // generate INTVal and move it to a float register, fall back to a
640 // floating-point load from the constant pool.
642 int InsNum = Seq.size() + ((VT == MVT::f64 && !Subtarget.is64Bit()) ? 2 : 1);
643 if (InsNum > MaterializeFPImmInsNum && !FPVal.isExactlyValue(+1.0))
644 return SDValue();
645
646 switch (VT.getSimpleVT().SimpleTy) {
647 default:
648 llvm_unreachable("Unexpected floating point type!");
649 break;
650 case MVT::f32: {
651 SDValue NewVal = DAG.getConstant(INTVal, DL, MVT::i32);
652 if (Subtarget.is64Bit())
653 NewVal = DAG.getNode(ISD::ANY_EXTEND, DL, MVT::i64, NewVal);
654 return DAG.getNode(Subtarget.is64Bit() ? LoongArchISD::MOVGR2FR_W_LA64
656 DL, VT, NewVal);
657 }
658 case MVT::f64: {
659 if (Subtarget.is64Bit()) {
660 SDValue NewVal = DAG.getConstant(INTVal, DL, MVT::i64);
661 return DAG.getNode(LoongArchISD::MOVGR2FR_D, DL, VT, NewVal);
662 }
663 SDValue Lo = DAG.getConstant(INTVal.trunc(32), DL, MVT::i32);
664 SDValue Hi = DAG.getConstant(INTVal.lshr(32).trunc(32), DL, MVT::i32);
665 return DAG.getNode(LoongArchISD::MOVGR2FR_D_LO_HI, DL, VT, Lo, Hi);
666 }
667 }
668
669 return SDValue();
670}
671
672// Lower vecreduce_add using vhaddw instructions.
673// For Example:
674// call i32 @llvm.vector.reduce.add.v4i32(<4 x i32> %a)
675// can be lowered to:
676// VHADDW_D_W vr0, vr0, vr0
677// VHADDW_Q_D vr0, vr0, vr0
678// VPICKVE2GR_D a0, vr0, 0
679// ADDI_W a0, a0, 0
680SDValue LoongArchTargetLowering::lowerVECREDUCE_ADD(SDValue Op,
681 SelectionDAG &DAG) const {
682
683 SDLoc DL(Op);
684 MVT OpVT = Op.getSimpleValueType();
685 SDValue Val = Op.getOperand(0);
686
687 unsigned NumEles = Val.getSimpleValueType().getVectorNumElements();
688 unsigned EleBits = Val.getSimpleValueType().getScalarSizeInBits();
689 unsigned ResBits = OpVT.getScalarSizeInBits();
690
691 unsigned LegalVecSize = 128;
692 bool isLASX256Vector =
693 Subtarget.hasExtLASX() && Val.getValueSizeInBits() == 256;
694
695 // Ensure the operand type is legal, widening the vector until it is.
696 while (!isTypeLegal(Val.getSimpleValueType())) {
697 Val = DAG.WidenVector(Val, DL);
698 }
699
700 // NumEles controls the iteration count; v4i32 for LSX and v8i32 for
701 // LASX should use the same count.
702 if (isLASX256Vector) {
703 NumEles /= 2;
704 LegalVecSize = 256;
705 }
706
707 for (unsigned i = 1; i < NumEles; i *= 2, EleBits *= 2) {
708 MVT IntTy = MVT::getIntegerVT(EleBits);
709 MVT VecTy = MVT::getVectorVT(IntTy, LegalVecSize / EleBits);
710 Val = DAG.getNode(LoongArchISD::VHADDW, DL, VecTy, Val, Val);
711 }
712
713 if (isLASX256Vector) {
714 SDValue Tmp = DAG.getNode(LoongArchISD::XVPERMI, DL, MVT::v4i64, Val,
715 DAG.getConstant(2, DL, Subtarget.getGRLenVT()));
716 Val = DAG.getNode(ISD::ADD, DL, MVT::v4i64, Tmp, Val);
717 }
718
719 Val = DAG.getBitcast(MVT::getVectorVT(OpVT, LegalVecSize / ResBits), Val);
720 return DAG.getNode(ISD::EXTRACT_VECTOR_ELT, DL, OpVT, Val,
721 DAG.getConstant(0, DL, Subtarget.getGRLenVT()));
722}
723
724// Lower vecreduce_and/or/xor/[s/u]max/[s/u]min.
725// For Example:
726// call i32 @llvm.vector.reduce.smax.v4i32(<4 x i32> %a)
727// can be lowered to:
728// VBSRL_V vr1, vr0, 8
729// VMAX_W vr0, vr1, vr0
730// VBSRL_V vr1, vr0, 4
731// VMAX_W vr0, vr1, vr0
732// VPICKVE2GR_W a0, vr0, 0
733 // A 256-bit vector type is illegal here and is split into two 128-bit
734 // vectors by default before being processed by this.
735SDValue LoongArchTargetLowering::lowerVECREDUCE(SDValue Op,
736 SelectionDAG &DAG) const {
737 SDLoc DL(Op);
738
739 MVT OpVT = Op.getSimpleValueType();
740 SDValue Val = Op.getOperand(0);
741
742 unsigned NumEles = Val.getSimpleValueType().getVectorNumElements();
743 unsigned EleBits = Val.getSimpleValueType().getScalarSizeInBits();
744
746 // Ensure the operand type is legal, widening the vector until it is.
746 while (!isTypeLegal(Val.getSimpleValueType())) {
747 Val = DAG.WidenVector(Val, DL);
748 }
749
750 unsigned Opcode = ISD::getVecReduceBaseOpcode(Op.getOpcode());
751 MVT VecTy = Val.getSimpleValueType();
752 MVT GRLenVT = Subtarget.getGRLenVT();
753
754 for (int i = NumEles; i > 1; i /= 2) {
755 SDValue ShiftAmt = DAG.getConstant(i * EleBits / 16, DL, GRLenVT);
756 SDValue Tmp = DAG.getNode(LoongArchISD::VBSRL, DL, VecTy, Val, ShiftAmt);
757 Val = DAG.getNode(Opcode, DL, VecTy, Tmp, Val);
758 }
759
760 return DAG.getNode(ISD::EXTRACT_VECTOR_ELT, DL, OpVT, Val,
761 DAG.getConstant(0, DL, GRLenVT));
762}
763
764SDValue LoongArchTargetLowering::lowerPREFETCH(SDValue Op,
765 SelectionDAG &DAG) const {
766 unsigned IsData = Op.getConstantOperandVal(4);
767
768 // We don't support non-data prefetch.
769 // Just preserve the chain.
770 if (!IsData)
771 return Op.getOperand(0);
772
773 return Op;
774}
775
776// Return true if Val is equal to (setcc LHS, RHS, CC).
777// Return false if Val is the inverse of (setcc LHS, RHS, CC).
778// Otherwise, return std::nullopt.
779static std::optional<bool> matchSetCC(SDValue LHS, SDValue RHS,
780 ISD::CondCode CC, SDValue Val) {
781 assert(Val->getOpcode() == ISD::SETCC);
782 SDValue LHS2 = Val.getOperand(0);
783 SDValue RHS2 = Val.getOperand(1);
784 ISD::CondCode CC2 = cast<CondCodeSDNode>(Val.getOperand(2))->get();
785
786 if (LHS == LHS2 && RHS == RHS2) {
787 if (CC == CC2)
788 return true;
789 if (CC == ISD::getSetCCInverse(CC2, LHS2.getValueType()))
790 return false;
791 } else if (LHS == RHS2 && RHS == LHS2) {
793 if (CC == CC2)
794 return true;
795 if (CC == ISD::getSetCCInverse(CC2, LHS2.getValueType()))
796 return false;
797 }
798
799 return std::nullopt;
800}
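// For example, matchSetCC(a, b, SETNE, (setcc a, b, SETEQ)) returns false,
// since SETEQ is the inverse of SETNE on the same operands, while an
// unrelated comparison such as (setcc a, c, SETEQ) yields std::nullopt.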
801
803 const LoongArchSubtarget &Subtarget) {
804 SDValue CondV = N->getOperand(0);
805 SDValue TrueV = N->getOperand(1);
806 SDValue FalseV = N->getOperand(2);
807 MVT VT = N->getSimpleValueType(0);
808 SDLoc DL(N);
809
810 // (select c, -1, y) -> -c | y
811 if (isAllOnesConstant(TrueV)) {
812 SDValue Neg = DAG.getNegative(CondV, DL, VT);
813 return DAG.getNode(ISD::OR, DL, VT, Neg, DAG.getFreeze(FalseV));
814 }
815 // (select c, y, -1) -> (c-1) | y
816 if (isAllOnesConstant(FalseV)) {
817 SDValue Neg =
818 DAG.getNode(ISD::ADD, DL, VT, CondV, DAG.getAllOnesConstant(DL, VT));
819 return DAG.getNode(ISD::OR, DL, VT, Neg, DAG.getFreeze(TrueV));
820 }
821
822 // (select c, 0, y) -> (c-1) & y
823 if (isNullConstant(TrueV)) {
824 SDValue Neg =
825 DAG.getNode(ISD::ADD, DL, VT, CondV, DAG.getAllOnesConstant(DL, VT));
826 return DAG.getNode(ISD::AND, DL, VT, Neg, DAG.getFreeze(FalseV));
827 }
828 // (select c, y, 0) -> -c & y
829 if (isNullConstant(FalseV)) {
830 SDValue Neg = DAG.getNegative(CondV, DL, VT);
831 return DAG.getNode(ISD::AND, DL, VT, Neg, DAG.getFreeze(TrueV));
832 }
833
834 // select c, ~x, x --> xor -c, x
835 if (isa<ConstantSDNode>(TrueV) && isa<ConstantSDNode>(FalseV)) {
836 const APInt &TrueVal = TrueV->getAsAPIntVal();
837 const APInt &FalseVal = FalseV->getAsAPIntVal();
838 if (~TrueVal == FalseVal) {
839 SDValue Neg = DAG.getNegative(CondV, DL, VT);
840 return DAG.getNode(ISD::XOR, DL, VT, Neg, FalseV);
841 }
842 }
843
844 // Try to fold (select (setcc lhs, rhs, cc), truev, falsev) into bitwise ops
845 // when both truev and falsev are also setcc.
846 if (CondV.getOpcode() == ISD::SETCC && TrueV.getOpcode() == ISD::SETCC &&
847 FalseV.getOpcode() == ISD::SETCC) {
848 SDValue LHS = CondV.getOperand(0);
849 SDValue RHS = CondV.getOperand(1);
850 ISD::CondCode CC = cast<CondCodeSDNode>(CondV.getOperand(2))->get();
851
852 // (select x, x, y) -> x | y
853 // (select !x, x, y) -> x & y
854 if (std::optional<bool> MatchResult = matchSetCC(LHS, RHS, CC, TrueV)) {
855 return DAG.getNode(*MatchResult ? ISD::OR : ISD::AND, DL, VT, TrueV,
856 DAG.getFreeze(FalseV));
857 }
858 // (select x, y, x) -> x & y
859 // (select !x, y, x) -> x | y
860 if (std::optional<bool> MatchResult = matchSetCC(LHS, RHS, CC, FalseV)) {
861 return DAG.getNode(*MatchResult ? ISD::AND : ISD::OR, DL, VT,
862 DAG.getFreeze(TrueV), FalseV);
863 }
864 }
865
866 return SDValue();
867}
868
869// Transform `binOp (select cond, x, c0), c1` where `c0` and `c1` are constants
870// into `select cond, binOp(x, c1), binOp(c0, c1)` if profitable.
871// For now we only consider the transformation profitable if `binOp(c0, c1)` ends up
872// being `0` or `-1`. In such cases we can replace `select` with `and`.
873// TODO: Should we also do this if `binOp(c0, c1)` is cheaper to materialize
874// than `c0`?
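// For example, (add (select cond, x, -1), 1) can be rewritten as
// (select cond, (add x, 1), 0), since add(-1, 1) == 0; a select with a zero
// arm is then cheap to lower as a masking AND.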
875static SDValue
877 const LoongArchSubtarget &Subtarget) {
878 unsigned SelOpNo = 0;
879 SDValue Sel = BO->getOperand(0);
880 if (Sel.getOpcode() != ISD::SELECT || !Sel.hasOneUse()) {
881 SelOpNo = 1;
882 Sel = BO->getOperand(1);
883 }
884
885 if (Sel.getOpcode() != ISD::SELECT || !Sel.hasOneUse())
886 return SDValue();
887
888 unsigned ConstSelOpNo = 1;
889 unsigned OtherSelOpNo = 2;
890 if (!isa<ConstantSDNode>(Sel->getOperand(ConstSelOpNo))) {
891 ConstSelOpNo = 2;
892 OtherSelOpNo = 1;
893 }
894 SDValue ConstSelOp = Sel->getOperand(ConstSelOpNo);
895 ConstantSDNode *ConstSelOpNode = dyn_cast<ConstantSDNode>(ConstSelOp);
896 if (!ConstSelOpNode || ConstSelOpNode->isOpaque())
897 return SDValue();
898
899 SDValue ConstBinOp = BO->getOperand(SelOpNo ^ 1);
900 ConstantSDNode *ConstBinOpNode = dyn_cast<ConstantSDNode>(ConstBinOp);
901 if (!ConstBinOpNode || ConstBinOpNode->isOpaque())
902 return SDValue();
903
904 SDLoc DL(Sel);
905 EVT VT = BO->getValueType(0);
906
907 SDValue NewConstOps[2] = {ConstSelOp, ConstBinOp};
908 if (SelOpNo == 1)
909 std::swap(NewConstOps[0], NewConstOps[1]);
910
911 SDValue NewConstOp =
912 DAG.FoldConstantArithmetic(BO->getOpcode(), DL, VT, NewConstOps);
913 if (!NewConstOp)
914 return SDValue();
915
916 const APInt &NewConstAPInt = NewConstOp->getAsAPIntVal();
917 if (!NewConstAPInt.isZero() && !NewConstAPInt.isAllOnes())
918 return SDValue();
919
920 SDValue OtherSelOp = Sel->getOperand(OtherSelOpNo);
921 SDValue NewNonConstOps[2] = {OtherSelOp, ConstBinOp};
922 if (SelOpNo == 1)
923 std::swap(NewNonConstOps[0], NewNonConstOps[1]);
924 SDValue NewNonConstOp = DAG.getNode(BO->getOpcode(), DL, VT, NewNonConstOps);
925
926 SDValue NewT = (ConstSelOpNo == 1) ? NewConstOp : NewNonConstOp;
927 SDValue NewF = (ConstSelOpNo == 1) ? NewNonConstOp : NewConstOp;
928 return DAG.getSelect(DL, VT, Sel.getOperand(0), NewT, NewF);
929}
930
931// Changes the condition code and swaps operands if necessary, so the SetCC
932// operation matches one of the comparisons supported directly by branches
933// in the LoongArch ISA. May adjust compares to favor compare with 0 over
934// compare with 1/-1.
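// For example, on LA64 the single-bit test (seteq (and x, 0x1000), 0), whose
// mask does not fit in a 12-bit immediate for ANDI, can become
// (setge (shl x, 51), 0): shifting bit 12 into the sign position lets the
// branch simply test the sign of the shifted value against zero.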
936 ISD::CondCode &CC, SelectionDAG &DAG) {
937 // If this is a single bit test that can't be handled by ANDI, shift the
938 // bit to be tested to the MSB and perform a signed compare with 0.
939 if (isIntEqualitySetCC(CC) && isNullConstant(RHS) &&
940 LHS.getOpcode() == ISD::AND && LHS.hasOneUse() &&
941 isa<ConstantSDNode>(LHS.getOperand(1))) {
942 uint64_t Mask = LHS.getConstantOperandVal(1);
943 if ((isPowerOf2_64(Mask) || isMask_64(Mask)) && !isInt<12>(Mask)) {
944 unsigned ShAmt = 0;
945 if (isPowerOf2_64(Mask)) {
946 CC = CC == ISD::SETEQ ? ISD::SETGE : ISD::SETLT;
947 ShAmt = LHS.getValueSizeInBits() - 1 - Log2_64(Mask);
948 } else {
949 ShAmt = LHS.getValueSizeInBits() - llvm::bit_width(Mask);
950 }
951
952 LHS = LHS.getOperand(0);
953 if (ShAmt != 0)
954 LHS = DAG.getNode(ISD::SHL, DL, LHS.getValueType(), LHS,
955 DAG.getConstant(ShAmt, DL, LHS.getValueType()));
956 return;
957 }
958 }
959
960 if (auto *RHSC = dyn_cast<ConstantSDNode>(RHS)) {
961 int64_t C = RHSC->getSExtValue();
962 switch (CC) {
963 default:
964 break;
965 case ISD::SETGT:
966 // Convert X > -1 to X >= 0.
967 if (C == -1) {
968 RHS = DAG.getConstant(0, DL, RHS.getValueType());
969 CC = ISD::SETGE;
970 return;
971 }
972 break;
973 case ISD::SETLT:
974 // Convert X < 1 to 0 >= X.
975 if (C == 1) {
976 RHS = LHS;
977 LHS = DAG.getConstant(0, DL, RHS.getValueType());
978 CC = ISD::SETGE;
979 return;
980 }
981 break;
982 }
983 }
984
985 switch (CC) {
986 default:
987 break;
988 case ISD::SETGT:
989 case ISD::SETLE:
990 case ISD::SETUGT:
991 case ISD::SETULE:
993 std::swap(LHS, RHS);
994 break;
995 }
996}
997
998SDValue LoongArchTargetLowering::lowerSELECT(SDValue Op,
999 SelectionDAG &DAG) const {
1000 SDValue CondV = Op.getOperand(0);
1001 SDValue TrueV = Op.getOperand(1);
1002 SDValue FalseV = Op.getOperand(2);
1003 SDLoc DL(Op);
1004 MVT VT = Op.getSimpleValueType();
1005 MVT GRLenVT = Subtarget.getGRLenVT();
1006
1007 if (SDValue V = combineSelectToBinOp(Op.getNode(), DAG, Subtarget))
1008 return V;
1009
1010 if (Op.hasOneUse()) {
1011 unsigned UseOpc = Op->user_begin()->getOpcode();
1012 if (isBinOp(UseOpc) && DAG.isSafeToSpeculativelyExecute(UseOpc)) {
1013 SDNode *BinOp = *Op->user_begin();
1014 if (SDValue NewSel = foldBinOpIntoSelectIfProfitable(*Op->user_begin(),
1015 DAG, Subtarget)) {
1016 DAG.ReplaceAllUsesWith(BinOp, &NewSel);
1017 // Opcode check is necessary because foldBinOpIntoSelectIfProfitable
1018 // may return a constant node and cause a crash in lowerSELECT.
1019 if (NewSel.getOpcode() == ISD::SELECT)
1020 return lowerSELECT(NewSel, DAG);
1021 return NewSel;
1022 }
1023 }
1024 }
1025
1026 // If the condition is not an integer SETCC which operates on GRLenVT, we need
1027 // to emit a LoongArchISD::SELECT_CC comparing the condition to zero. i.e.:
1028 // (select condv, truev, falsev)
1029 // -> (loongarchisd::select_cc condv, zero, setne, truev, falsev)
1030 if (CondV.getOpcode() != ISD::SETCC ||
1031 CondV.getOperand(0).getSimpleValueType() != GRLenVT) {
1032 SDValue Zero = DAG.getConstant(0, DL, GRLenVT);
1033 SDValue SetNE = DAG.getCondCode(ISD::SETNE);
1034
1035 SDValue Ops[] = {CondV, Zero, SetNE, TrueV, FalseV};
1036
1037 return DAG.getNode(LoongArchISD::SELECT_CC, DL, VT, Ops);
1038 }
1039
1040 // If the CondV is the output of a SETCC node which operates on GRLenVT
1041 // inputs, then merge the SETCC node into the lowered LoongArchISD::SELECT_CC
1042 // to take advantage of the integer compare+branch instructions. i.e.: (select
1043 // (setcc lhs, rhs, cc), truev, falsev)
1044 // -> (loongarchisd::select_cc lhs, rhs, cc, truev, falsev)
1045 SDValue LHS = CondV.getOperand(0);
1046 SDValue RHS = CondV.getOperand(1);
1047 ISD::CondCode CCVal = cast<CondCodeSDNode>(CondV.getOperand(2))->get();
1048
1049 // Special case for a select of 2 constants that have a difference of 1.
1050 // Normally this is done by DAGCombine, but if the select is introduced by
1051 // type legalization or op legalization, we miss it. Restricting to SETLT
1052 // case for now because that is what signed saturating add/sub need.
1053 // FIXME: We don't need the condition to be SETLT or even a SETCC,
1054 // but we would probably want to swap the true/false values if the condition
1055 // is SETGE/SETLE to avoid an XORI.
1056 if (isa<ConstantSDNode>(TrueV) && isa<ConstantSDNode>(FalseV) &&
1057 CCVal == ISD::SETLT) {
1058 const APInt &TrueVal = TrueV->getAsAPIntVal();
1059 const APInt &FalseVal = FalseV->getAsAPIntVal();
1060 if (TrueVal - 1 == FalseVal)
1061 return DAG.getNode(ISD::ADD, DL, VT, CondV, FalseV);
1062 if (TrueVal + 1 == FalseVal)
1063 return DAG.getNode(ISD::SUB, DL, VT, FalseV, CondV);
1064 }
1065
1066 translateSetCCForBranch(DL, LHS, RHS, CCVal, DAG);
1067 // 1 < x ? x : 1 -> 0 < x ? x : 1
1068 if (isOneConstant(LHS) && (CCVal == ISD::SETLT || CCVal == ISD::SETULT) &&
1069 RHS == TrueV && LHS == FalseV) {
1070 LHS = DAG.getConstant(0, DL, VT);
1071 // 0 <u x is the same as x != 0.
1072 if (CCVal == ISD::SETULT) {
1073 std::swap(LHS, RHS);
1074 CCVal = ISD::SETNE;
1075 }
1076 }
1077
1078 // x <s -1 ? x : -1 -> x <s 0 ? x : -1
1079 if (isAllOnesConstant(RHS) && CCVal == ISD::SETLT && LHS == TrueV &&
1080 RHS == FalseV) {
1081 RHS = DAG.getConstant(0, DL, VT);
1082 }
1083
1084 SDValue TargetCC = DAG.getCondCode(CCVal);
1085
1086 if (isa<ConstantSDNode>(TrueV) && !isa<ConstantSDNode>(FalseV)) {
1087 // (select (setcc lhs, rhs, CC), constant, falsev)
1088 // -> (select (setcc lhs, rhs, InverseCC), falsev, constant)
1089 std::swap(TrueV, FalseV);
1090 TargetCC = DAG.getCondCode(ISD::getSetCCInverse(CCVal, LHS.getValueType()));
1091 }
1092
1093 SDValue Ops[] = {LHS, RHS, TargetCC, TrueV, FalseV};
1094 return DAG.getNode(LoongArchISD::SELECT_CC, DL, VT, Ops);
1095}
1096
1097SDValue LoongArchTargetLowering::lowerBRCOND(SDValue Op,
1098 SelectionDAG &DAG) const {
1099 SDValue CondV = Op.getOperand(1);
1100 SDLoc DL(Op);
1101 MVT GRLenVT = Subtarget.getGRLenVT();
1102
1103 if (CondV.getOpcode() == ISD::SETCC) {
1104 if (CondV.getOperand(0).getValueType() == GRLenVT) {
1105 SDValue LHS = CondV.getOperand(0);
1106 SDValue RHS = CondV.getOperand(1);
1107 ISD::CondCode CCVal = cast<CondCodeSDNode>(CondV.getOperand(2))->get();
1108
1109 translateSetCCForBranch(DL, LHS, RHS, CCVal, DAG);
1110
1111 SDValue TargetCC = DAG.getCondCode(CCVal);
1112 return DAG.getNode(LoongArchISD::BR_CC, DL, Op.getValueType(),
1113 Op.getOperand(0), LHS, RHS, TargetCC,
1114 Op.getOperand(2));
1115 } else if (CondV.getOperand(0).getValueType().isFloatingPoint()) {
1116 return DAG.getNode(LoongArchISD::BRCOND, DL, Op.getValueType(),
1117 Op.getOperand(0), CondV, Op.getOperand(2));
1118 }
1119 }
1120
1121 return DAG.getNode(LoongArchISD::BR_CC, DL, Op.getValueType(),
1122 Op.getOperand(0), CondV, DAG.getConstant(0, DL, GRLenVT),
1123 DAG.getCondCode(ISD::SETNE), Op.getOperand(2));
1124}
1125
1126SDValue
1127LoongArchTargetLowering::lowerSCALAR_TO_VECTOR(SDValue Op,
1128 SelectionDAG &DAG) const {
1129 SDLoc DL(Op);
1130 MVT OpVT = Op.getSimpleValueType();
1131
1132 SDValue Vector = DAG.getUNDEF(OpVT);
1133 SDValue Val = Op.getOperand(0);
1134 SDValue Idx = DAG.getConstant(0, DL, Subtarget.getGRLenVT());
1135
1136 return DAG.getNode(ISD::INSERT_VECTOR_ELT, DL, OpVT, Vector, Val, Idx);
1137}
1138
1139SDValue LoongArchTargetLowering::lowerBITREVERSE(SDValue Op,
1140 SelectionDAG &DAG) const {
1141 EVT ResTy = Op->getValueType(0);
1142 SDValue Src = Op->getOperand(0);
1143 SDLoc DL(Op);
1144
1145 // LoongArchISD::BITREV_8B is not supported on LA32.
1146 if (!Subtarget.is64Bit() && (ResTy == MVT::v16i8 || ResTy == MVT::v32i8))
1147 return SDValue();
1148
1149 EVT NewVT = ResTy.is128BitVector() ? MVT::v2i64 : MVT::v4i64;
1150 unsigned int OrigEltNum = ResTy.getVectorNumElements();
1151 unsigned int NewEltNum = NewVT.getVectorNumElements();
1152
1153 SDValue NewSrc = DAG.getNode(ISD::BITCAST, DL, NewVT, Src);
1154
1156 for (unsigned int i = 0; i < NewEltNum; i++) {
1157 SDValue Op = DAG.getNode(ISD::EXTRACT_VECTOR_ELT, DL, MVT::i64, NewSrc,
1158 DAG.getConstant(i, DL, Subtarget.getGRLenVT()));
1159 unsigned RevOp = (ResTy == MVT::v16i8 || ResTy == MVT::v32i8)
1160 ? (unsigned)LoongArchISD::BITREV_8B
1161 : (unsigned)ISD::BITREVERSE;
1162 Ops.push_back(DAG.getNode(RevOp, DL, MVT::i64, Op));
1163 }
1164 SDValue Res =
1165 DAG.getNode(ISD::BITCAST, DL, ResTy, DAG.getBuildVector(NewVT, DL, Ops));
1166
1167 switch (ResTy.getSimpleVT().SimpleTy) {
1168 default:
1169 return SDValue();
1170 case MVT::v16i8:
1171 case MVT::v32i8:
1172 return Res;
1173 case MVT::v8i16:
1174 case MVT::v16i16:
1175 case MVT::v4i32:
1176 case MVT::v8i32: {
1178 for (unsigned int i = 0; i < NewEltNum; i++)
1179 for (int j = OrigEltNum / NewEltNum - 1; j >= 0; j--)
1180 Mask.push_back(j + (OrigEltNum / NewEltNum) * i);
1181 return DAG.getVectorShuffle(ResTy, DL, Res, DAG.getUNDEF(ResTy), Mask);
1182 }
1183 }
1184}
1185
1186// Widen element type to get a new mask value (if possible).
1187// For example:
1188// shufflevector <4 x i32> %a, <4 x i32> %b,
1189// <4 x i32> <i32 6, i32 7, i32 2, i32 3>
1190// is equivalent to:
1191// shufflevector <2 x i64> %a, <2 x i64> %b, <2 x i32> <i32 3, i32 1>
1192// can be lowered to:
1193// VPACKOD_D vr0, vr0, vr1
1195 SDValue V1, SDValue V2, SelectionDAG &DAG) {
1196 unsigned EltBits = VT.getScalarSizeInBits();
1197
1198 if (EltBits > 32 || EltBits == 1)
1199 return SDValue();
1200
1201 SmallVector<int, 8> NewMask;
1202 if (widenShuffleMaskElts(Mask, NewMask)) {
1203 MVT NewEltVT = VT.isFloatingPoint() ? MVT::getFloatingPointVT(EltBits * 2)
1204 : MVT::getIntegerVT(EltBits * 2);
1205 MVT NewVT = MVT::getVectorVT(NewEltVT, VT.getVectorNumElements() / 2);
1206 if (DAG.getTargetLoweringInfo().isTypeLegal(NewVT)) {
1207 SDValue NewV1 = DAG.getBitcast(NewVT, V1);
1208 SDValue NewV2 = DAG.getBitcast(NewVT, V2);
1209 return DAG.getBitcast(
1210 VT, DAG.getVectorShuffle(NewVT, DL, NewV1, NewV2, NewMask));
1211 }
1212 }
1213
1214 return SDValue();
1215}
1216
1217/// Attempts to match a shuffle mask against the VBSLL, VBSRL, VSLLI and VSRLI
1218/// instructions.
1219// The function matches elements from one of the input vectors shuffled to the
1220// left or right with zeroable elements 'shifted in'. It handles both the
1221// strictly bit-wise element shifts and the byte shift across an entire 128-bit
1222// lane.
1223// Mostly copied from X86.
1224static int matchShuffleAsShift(MVT &ShiftVT, unsigned &Opcode,
1225 unsigned ScalarSizeInBits, ArrayRef<int> Mask,
1226 int MaskOffset, const APInt &Zeroable) {
1227 int Size = Mask.size();
1228 unsigned SizeInBits = Size * ScalarSizeInBits;
1229
1230 auto CheckZeros = [&](int Shift, int Scale, bool Left) {
1231 for (int i = 0; i < Size; i += Scale)
1232 for (int j = 0; j < Shift; ++j)
1233 if (!Zeroable[i + j + (Left ? 0 : (Scale - Shift))])
1234 return false;
1235
1236 return true;
1237 };
1238
1239 auto isSequentialOrUndefInRange = [&](unsigned Pos, unsigned Size, int Low,
1240 int Step = 1) {
1241 for (unsigned i = Pos, e = Pos + Size; i != e; ++i, Low += Step)
1242 if (!(Mask[i] == -1 || Mask[i] == Low))
1243 return false;
1244 return true;
1245 };
1246
1247 auto MatchShift = [&](int Shift, int Scale, bool Left) {
1248 for (int i = 0; i != Size; i += Scale) {
1249 unsigned Pos = Left ? i + Shift : i;
1250 unsigned Low = Left ? i : i + Shift;
1251 unsigned Len = Scale - Shift;
1252 if (!isSequentialOrUndefInRange(Pos, Len, Low + MaskOffset))
1253 return -1;
1254 }
1255
1256 int ShiftEltBits = ScalarSizeInBits * Scale;
1257 bool ByteShift = ShiftEltBits > 64;
1258 Opcode = Left ? (ByteShift ? LoongArchISD::VBSLL : LoongArchISD::VSLLI)
1259 : (ByteShift ? LoongArchISD::VBSRL : LoongArchISD::VSRLI);
1260 int ShiftAmt = Shift * ScalarSizeInBits / (ByteShift ? 8 : 1);
1261
1262 // Normalize the scale for byte shifts to still produce an i64 element
1263 // type.
1264 Scale = ByteShift ? Scale / 2 : Scale;
1265
1266 // We need to round trip through the appropriate type for the shift.
1267 MVT ShiftSVT = MVT::getIntegerVT(ScalarSizeInBits * Scale);
1268 ShiftVT = ByteShift ? MVT::getVectorVT(MVT::i8, SizeInBits / 8)
1269 : MVT::getVectorVT(ShiftSVT, Size / Scale);
1270 return (int)ShiftAmt;
1271 };
1272
1273 unsigned MaxWidth = 128;
1274 for (int Scale = 2; Scale * ScalarSizeInBits <= MaxWidth; Scale *= 2)
1275 for (int Shift = 1; Shift != Scale; ++Shift)
1276 for (bool Left : {true, false})
1277 if (CheckZeros(Shift, Scale, Left)) {
1278 int ShiftAmt = MatchShift(Shift, Scale, Left);
1279 if (0 < ShiftAmt)
1280 return ShiftAmt;
1281 }
1282
1283 // no match
1284 return -1;
1285}
1286
1287/// Lower VECTOR_SHUFFLE as shift (if possible).
1288///
1289/// For example:
1290/// %2 = shufflevector <4 x i32> %0, <4 x i32> zeroinitializer,
1291/// <4 x i32> <i32 4, i32 0, i32 1, i32 2>
1292/// is lowered to:
1293/// (VBSLL_V $v0, $v0, 4)
1294///
1295/// %2 = shufflevector <4 x i32> %0, <4 x i32> zeroinitializer,
1296/// <4 x i32> <i32 4, i32 0, i32 4, i32 2>
1297/// is lowered to:
1298/// (VSLLI_D $v0, $v0, 32)
1300 MVT VT, SDValue V1, SDValue V2,
1301 SelectionDAG &DAG,
1302 const LoongArchSubtarget &Subtarget,
1303 const APInt &Zeroable) {
1304 int Size = Mask.size();
1305 assert(Size == (int)VT.getVectorNumElements() && "Unexpected mask size");
1306
1307 MVT ShiftVT;
1308 SDValue V = V1;
1309 unsigned Opcode;
1310
1311 // Try to match shuffle against V1 shift.
1312 int ShiftAmt = matchShuffleAsShift(ShiftVT, Opcode, VT.getScalarSizeInBits(),
1313 Mask, 0, Zeroable);
1314
1315 // If V1 failed, try to match shuffle against V2 shift.
1316 if (ShiftAmt < 0) {
1317 ShiftAmt = matchShuffleAsShift(ShiftVT, Opcode, VT.getScalarSizeInBits(),
1318 Mask, Size, Zeroable);
1319 V = V2;
1320 }
1321
1322 if (ShiftAmt < 0)
1323 return SDValue();
1324
1325 assert(DAG.getTargetLoweringInfo().isTypeLegal(ShiftVT) &&
1326 "Illegal integer vector type");
1327 V = DAG.getBitcast(ShiftVT, V);
1328 V = DAG.getNode(Opcode, DL, ShiftVT, V,
1329 DAG.getConstant(ShiftAmt, DL, Subtarget.getGRLenVT()));
1330 return DAG.getBitcast(VT, V);
1331}
1332
1333/// Determine whether a range fits a regular pattern of values.
1334/// This function accounts for the possibility of jumping over the End iterator.
1335template <typename ValType>
1336static bool
1338 unsigned CheckStride,
1340 ValType ExpectedIndex, unsigned ExpectedIndexStride) {
1341 auto &I = Begin;
1342
1343 while (I != End) {
1344 if (*I != -1 && *I != ExpectedIndex)
1345 return false;
1346 ExpectedIndex += ExpectedIndexStride;
1347
1348 // Incrementing past End is undefined behaviour so we must increment one
1349 // step at a time and check for End at each step.
1350 for (unsigned n = 0; n < CheckStride && I != End; ++n, ++I)
1351 ; // Empty loop body.
1352 }
1353 return true;
1354}
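// For example, fitsRegularPattern<int>(Mask.begin(), 2, Mask.end(), 0, 2)
// checks that the elements at even positions of the mask are either undef
// (-1) or the sequence 0, 2, 4, ..., i.e. they select the even elements of
// the first input vector.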
1355
1356/// Compute whether each element of a shuffle is zeroable.
1357///
1358/// A "zeroable" vector shuffle element is one which can be lowered to zero.
1360 SDValue V2, APInt &KnownUndef,
1361 APInt &KnownZero) {
1362 int Size = Mask.size();
1363 KnownUndef = KnownZero = APInt::getZero(Size);
1364
1365 V1 = peekThroughBitcasts(V1);
1366 V2 = peekThroughBitcasts(V2);
1367
1368 bool V1IsZero = ISD::isBuildVectorAllZeros(V1.getNode());
1369 bool V2IsZero = ISD::isBuildVectorAllZeros(V2.getNode());
1370
1371 int VectorSizeInBits = V1.getValueSizeInBits();
1372 int ScalarSizeInBits = VectorSizeInBits / Size;
1373 assert(!(VectorSizeInBits % ScalarSizeInBits) && "Illegal shuffle mask size");
1374 (void)ScalarSizeInBits;
1375
1376 for (int i = 0; i < Size; ++i) {
1377 int M = Mask[i];
1378 if (M < 0) {
1379 KnownUndef.setBit(i);
1380 continue;
1381 }
1382 if ((M >= 0 && M < Size && V1IsZero) || (M >= Size && V2IsZero)) {
1383 KnownZero.setBit(i);
1384 continue;
1385 }
1386 }
1387}
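// For example, shuffling <4 x i32> %v with zeroinitializer using the mask
// <4, 0, 1, 2> marks element 0 as known-zero (it reads from the all-zero
// second operand), while elements 1..3 are neither zero nor undef.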
1388
1389/// Test whether a shuffle mask is equivalent within each sub-lane.
1390///
1391/// The specific repeated shuffle mask is populated in \p RepeatedMask, as it is
1392/// non-trivial to compute in the face of undef lanes. The representation is
1393/// suitable for use with existing 128-bit shuffles as entries from the second
1394/// vector have been remapped to [LaneSize, 2*LaneSize).
1395static bool isRepeatedShuffleMask(unsigned LaneSizeInBits, MVT VT,
1396 ArrayRef<int> Mask,
1397 SmallVectorImpl<int> &RepeatedMask) {
1398 auto LaneSize = LaneSizeInBits / VT.getScalarSizeInBits();
1399 RepeatedMask.assign(LaneSize, -1);
1400 int Size = Mask.size();
1401 for (int i = 0; i < Size; ++i) {
1402 assert(Mask[i] == -1 || Mask[i] >= 0);
1403 if (Mask[i] < 0)
1404 continue;
1405 if ((Mask[i] % Size) / LaneSize != i / LaneSize)
1406 // This entry crosses lanes, so there is no way to model this shuffle.
1407 return false;
1408
1409 // Ok, handle the in-lane shuffles by detecting if and when they repeat.
1410 // Adjust second vector indices to start at LaneSize instead of Size.
1411 int LocalM =
1412 Mask[i] < Size ? Mask[i] % LaneSize : Mask[i] % LaneSize + LaneSize;
1413 if (RepeatedMask[i % LaneSize] < 0)
1414 // This is the first non-undef entry in this slot of a 128-bit lane.
1415 RepeatedMask[i % LaneSize] = LocalM;
1416 else if (RepeatedMask[i % LaneSize] != LocalM)
1417 // Found a mismatch with the repeated mask.
1418 return false;
1419 }
1420 return true;
1421}
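// For example, for v8i32 with 128-bit lanes, the mask
// <0, 9, 2, 11, 4, 13, 6, 15> repeats the per-lane mask <0, 5, 2, 7>
// (second-vector indices remapped to start at LaneSize), so this returns
// true; a mask whose entries cross lanes returns false.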
1422
1423/// Attempts to match a vector shuffle as a byte rotation.
1425 ArrayRef<int> Mask) {
1426
1427 SDValue Lo, Hi;
1428 SmallVector<int, 16> RepeatedMask;
1429
1430 if (!isRepeatedShuffleMask(128, VT, Mask, RepeatedMask))
1431 return -1;
1432
1433 int NumElts = RepeatedMask.size();
1434 int Rotation = 0;
1435 int Scale = 16 / NumElts;
1436
1437 for (int i = 0; i < NumElts; ++i) {
1438 int M = RepeatedMask[i];
1439 assert((M == -1 || (0 <= M && M < (2 * NumElts))) &&
1440 "Unexpected mask index.");
1441 if (M < 0)
1442 continue;
1443
1444 // Determine where a rotated vector would have started.
1445 int StartIdx = i - (M % NumElts);
1446 if (StartIdx == 0)
1447 return -1;
1448
1449 // If we found the tail of a vector the rotation must be the missing
1450 // front. If we found the head of a vector, it must be how much of the
1451 // head.
1452 int CandidateRotation = StartIdx < 0 ? -StartIdx : NumElts - StartIdx;
1453
1454 if (Rotation == 0)
1455 Rotation = CandidateRotation;
1456 else if (Rotation != CandidateRotation)
1457 return -1;
1458
1459 // Compute which value this mask is pointing at.
1460 SDValue MaskV = M < NumElts ? V1 : V2;
1461
1462 // Compute which of the two target values this index should be assigned
1463 // to. This reflects whether the high elements are remaining or the low
1464 // elements are remaining.
1465 SDValue &TargetV = StartIdx < 0 ? Hi : Lo;
1466
1467 // Either set up this value if we've not encountered it before, or check
1468 // that it remains consistent.
1469 if (!TargetV)
1470 TargetV = MaskV;
1471 else if (TargetV != MaskV)
1472 return -1;
1473 }
1474
1475 // Check that we successfully analyzed the mask, and normalize the results.
1476 assert(Rotation != 0 && "Failed to locate a viable rotation!");
1477 assert((Lo || Hi) && "Failed to find a rotated input vector!");
1478 if (!Lo)
1479 Lo = Hi;
1480 else if (!Hi)
1481 Hi = Lo;
1482
1483 V1 = Lo;
1484 V2 = Hi;
1485
1486 return Rotation * Scale;
1487}
1488
1489/// Lower VECTOR_SHUFFLE as byte rotate (if possible).
1490///
1491/// For example:
1492/// %shuffle = shufflevector <2 x i64> %a, <2 x i64> %b,
1493/// <2 x i32> <i32 3, i32 0>
1494/// is lowered to:
1495/// (VBSRL_V $v1, $v1, 8)
1496/// (VBSLL_V $v0, $v0, 8)
1497/// (VOR_V $v0, $V0, $v1)
1498static SDValue
1500 SDValue V1, SDValue V2, SelectionDAG &DAG,
1501 const LoongArchSubtarget &Subtarget) {
1502
1503 SDValue Lo = V1, Hi = V2;
1504 int ByteRotation = matchShuffleAsByteRotate(VT, Lo, Hi, Mask);
1505 if (ByteRotation <= 0)
1506 return SDValue();
1507
1508 MVT ByteVT = MVT::getVectorVT(MVT::i8, VT.getSizeInBits() / 8);
1509 Lo = DAG.getBitcast(ByteVT, Lo);
1510 Hi = DAG.getBitcast(ByteVT, Hi);
1511
1512 int LoByteShift = 16 - ByteRotation;
1513 int HiByteShift = ByteRotation;
1514 MVT GRLenVT = Subtarget.getGRLenVT();
1515
1516 SDValue LoShift = DAG.getNode(LoongArchISD::VBSLL, DL, ByteVT, Lo,
1517 DAG.getConstant(LoByteShift, DL, GRLenVT));
1518 SDValue HiShift = DAG.getNode(LoongArchISD::VBSRL, DL, ByteVT, Hi,
1519 DAG.getConstant(HiByteShift, DL, GRLenVT));
1520 return DAG.getBitcast(VT, DAG.getNode(ISD::OR, DL, ByteVT, LoShift, HiShift));
1521}
1522
1523/// Lower VECTOR_SHUFFLE as ZERO_EXTEND Or ANY_EXTEND (if possible).
1524///
1525/// For example:
1526/// %2 = shufflevector <4 x i32> %0, <4 x i32> zeroinitializer,
1527/// <4 x i32> <i32 0, i32 4, i32 1, i32 4>
1528/// %3 = bitcast <4 x i32> %2 to <2 x i64>
1529/// is lowered to:
1530/// (VREPLI $v1, 0)
1531/// (VILVL $v0, $v1, $v0)
1533 ArrayRef<int> Mask, MVT VT,
1534 SDValue V1, SDValue V2,
1535 SelectionDAG &DAG,
1536 const APInt &Zeroable) {
1537 int Bits = VT.getSizeInBits();
1538 int EltBits = VT.getScalarSizeInBits();
1539 int NumElements = VT.getVectorNumElements();
1540
1541 if (Zeroable.isAllOnes())
1542 return DAG.getConstant(0, DL, VT);
1543
1544 // Define a helper function to check a particular ext-scale and lower to it if
1545 // valid.
1546 auto Lower = [&](int Scale) -> SDValue {
1547 SDValue InputV;
1548 bool AnyExt = true;
1549 int Offset = 0;
1550 for (int i = 0; i < NumElements; i++) {
1551 int M = Mask[i];
1552 if (M < 0)
1553 continue;
1554 if (i % Scale != 0) {
1555 // Each of the extended elements needs to be zeroable.
1556 if (!Zeroable[i])
1557 return SDValue();
1558
1559 AnyExt = false;
1560 continue;
1561 }
1562
1563 // The base elements need to be consecutive indices into the
1564 // same input vector.
1565 SDValue V = M < NumElements ? V1 : V2;
1566 M = M % NumElements;
1567 if (!InputV) {
1568 InputV = V;
1569 Offset = M - (i / Scale);
1570
1571 // These offsets can't be handled.
1572 if (Offset % (NumElements / Scale))
1573 return SDValue();
1574 } else if (InputV != V)
1575 return SDValue();
1576
1577 if (M != (Offset + (i / Scale)))
1578 return SDValue(); // Non-consecutive strided elements.
1579 }
1580
1581 // If we fail to find an input, we have a zero-shuffle which should always
1582 // have already been handled.
1583 if (!InputV)
1584 return SDValue();
1585
1586 do {
1587 unsigned VilVLoHi = LoongArchISD::VILVL;
1588 if (Offset >= (NumElements / 2)) {
1589 VilVLoHi = LoongArchISD::VILVH;
1590 Offset -= (NumElements / 2);
1591 }
1592
1593 MVT InputVT = MVT::getVectorVT(MVT::getIntegerVT(EltBits), NumElements);
1594 SDValue Ext =
1595 AnyExt ? DAG.getFreeze(InputV) : DAG.getConstant(0, DL, InputVT);
1596 InputV = DAG.getBitcast(InputVT, InputV);
1597 InputV = DAG.getNode(VilVLoHi, DL, InputVT, Ext, InputV);
1598 Scale /= 2;
1599 EltBits *= 2;
1600 NumElements /= 2;
1601 } while (Scale > 1);
1602 return DAG.getBitcast(VT, InputV);
1603 };
1604
1605 // Each iteration, try extending the elements half as much, but into twice as
1606 // many elements.
1607 for (int NumExtElements = Bits / 64; NumExtElements < NumElements;
1608 NumExtElements *= 2) {
1609 if (SDValue V = Lower(NumElements / NumExtElements))
1610 return V;
1611 }
1612 return SDValue();
1613}
1614
1615/// Lower VECTOR_SHUFFLE into VREPLVEI (if possible).
1616///
1617/// VREPLVEI performs vector broadcast based on an element specified by an
1618/// integer immediate, with its mask being similar to:
1619/// <x, x, x, ...>
1620/// where x is any valid index.
1621///
1622/// When undef's appear in the mask they are treated as if they were whatever
1623/// value is necessary in order to fit the above form.
1624static SDValue
1626 SDValue V1, SelectionDAG &DAG,
1627 const LoongArchSubtarget &Subtarget) {
1628 int SplatIndex = -1;
1629 for (const auto &M : Mask) {
1630 if (M != -1) {
1631 SplatIndex = M;
1632 break;
1633 }
1634 }
1635
1636 if (SplatIndex == -1)
1637 return DAG.getUNDEF(VT);
1638
1639 assert(SplatIndex < (int)Mask.size() && "Out of bounds mask index");
1640 if (fitsRegularPattern<int>(Mask.begin(), 1, Mask.end(), SplatIndex, 0)) {
1641 return DAG.getNode(LoongArchISD::VREPLVEI, DL, VT, V1,
1642 DAG.getConstant(SplatIndex, DL, Subtarget.getGRLenVT()));
1643 }
1644
1645 return SDValue();
1646}
1647
1648/// Lower VECTOR_SHUFFLE into VSHUF4I (if possible).
1649///
1650/// VSHUF4I splits the vector into blocks of four elements, then shuffles these
1651/// elements according to a <4 x i2> constant (encoded as an integer immediate).
1652///
1653/// It is therefore possible to lower into VSHUF4I when the mask takes the form:
1654/// <a, b, c, d, a+4, b+4, c+4, d+4, a+8, b+8, c+8, d+8, ...>
1655/// When undef's appear they are treated as if they were whatever value is
1656/// necessary in order to fit the above forms.
1657///
1658/// For example:
1659/// %2 = shufflevector <8 x i16> %0, <8 x i16> undef,
1660/// <8 x i32> <i32 3, i32 2, i32 1, i32 0,
1661/// i32 7, i32 6, i32 5, i32 4>
1662/// is lowered to:
1663/// (VSHUF4I_H $v0, $v1, 27)
1664/// where the 27 comes from:
1665/// 3 + (2 << 2) + (1 << 4) + (0 << 6)
1666static SDValue
1668 SDValue V1, SDValue V2, SelectionDAG &DAG,
1669 const LoongArchSubtarget &Subtarget) {
1670
1671 unsigned SubVecSize = 4;
1672 if (VT == MVT::v2f64 || VT == MVT::v2i64)
1673 SubVecSize = 2;
1674
1675 int SubMask[4] = {-1, -1, -1, -1};
1676 for (unsigned i = 0; i < SubVecSize; ++i) {
1677 for (unsigned j = i; j < Mask.size(); j += SubVecSize) {
1678 int M = Mask[j];
1679
1680 // Convert from vector index to 4-element subvector index
1681 // If an index refers to an element outside of the subvector then give up
1682 if (M != -1) {
1683 M -= 4 * (j / SubVecSize);
1684 if (M < 0 || M >= 4)
1685 return SDValue();
1686 }
1687
1688 // If the mask has an undef, replace it with the current index.
1689 // Note that it might still be undef if the current index is also undef
1690 if (SubMask[i] == -1)
1691 SubMask[i] = M;
1692 // Check that non-undef values are the same as in the mask. If they
1693 // aren't then give up
1694 else if (M != -1 && M != SubMask[i])
1695 return SDValue();
1696 }
1697 }
1698
1699 // Calculate the immediate. Replace any remaining undefs with zero
1700 int Imm = 0;
1701 for (int i = SubVecSize - 1; i >= 0; --i) {
1702 int M = SubMask[i];
1703
1704 if (M == -1)
1705 M = 0;
1706
1707 Imm <<= 2;
1708 Imm |= M & 0x3;
1709 }
1710
1711 MVT GRLenVT = Subtarget.getGRLenVT();
1712
1713 // Return vshuf4i.d
1714 if (VT == MVT::v2f64 || VT == MVT::v2i64)
1715 return DAG.getNode(LoongArchISD::VSHUF4I, DL, VT, V1, V2,
1716 DAG.getConstant(Imm, DL, GRLenVT));
1717
1718 return DAG.getNode(LoongArchISD::VSHUF4I, DL, VT, V1,
1719 DAG.getConstant(Imm, DL, GRLenVT));
1720}
1721
1722/// Lower VECTOR_SHUFFLE whose result is the reversed source vector.
1723///
1724/// It is possible to optimize a VECTOR_SHUFFLE performing a vector
1725/// reverse, whose mask looks like:
1726/// <7, 6, 5, 4, 3, 2, 1, 0>
1727///
1728/// When undef's appear in the mask they are treated as if they were whatever
1729/// value is necessary in order to fit the above forms.
1730static SDValue
1732 SDValue V1, SelectionDAG &DAG,
1733 const LoongArchSubtarget &Subtarget) {
1734 // Only vectors with i8/i16 elements, which cannot match other patterns
1735 // directly, need to do this.
1736 if (VT != MVT::v16i8 && VT != MVT::v8i16 && VT != MVT::v32i8 &&
1737 VT != MVT::v16i16)
1738 return SDValue();
1739
1740 if (!ShuffleVectorInst::isReverseMask(Mask, Mask.size()))
1741 return SDValue();
1742
1743 int WidenNumElts = VT.getVectorNumElements() / 4;
1744 SmallVector<int, 16> WidenMask(WidenNumElts, -1);
1745 for (int i = 0; i < WidenNumElts; ++i)
1746 WidenMask[i] = WidenNumElts - 1 - i;
1747
1748 MVT WidenVT = MVT::getVectorVT(
1749 VT.getVectorElementType() == MVT::i8 ? MVT::i32 : MVT::i64, WidenNumElts);
1750 SDValue NewV1 = DAG.getBitcast(WidenVT, V1);
1751 SDValue WidenRev = DAG.getVectorShuffle(WidenVT, DL, NewV1,
1752 DAG.getUNDEF(WidenVT), WidenMask);
1753
1754 return DAG.getNode(LoongArchISD::VSHUF4I, DL, VT,
1755 DAG.getBitcast(VT, WidenRev),
1756 DAG.getConstant(27, DL, Subtarget.getGRLenVT()));
1757}
1758
1759/// Lower VECTOR_SHUFFLE into VPACKEV (if possible).
1760///
1761/// VPACKEV interleaves the even elements from each vector.
1762///
1763/// It is possible to lower into VPACKEV when the mask consists of two of the
1764/// following forms interleaved:
1765/// <0, 2, 4, ...>
1766/// <n, n+2, n+4, ...>
1767/// where n is the number of elements in the vector.
1768/// For example:
1769/// <0, 0, 2, 2, 4, 4, ...>
1770/// <0, n, 2, n+2, 4, n+4, ...>
1771///
1772/// When undef's appear in the mask they are treated as if they were whatever
1773/// value is necessary in order to fit the above forms.
1775 MVT VT, SDValue V1, SDValue V2,
1776 SelectionDAG &DAG) {
1777
1778 const auto &Begin = Mask.begin();
1779 const auto &End = Mask.end();
1780 SDValue OriV1 = V1, OriV2 = V2;
1781
1782 if (fitsRegularPattern<int>(Begin, 2, End, 0, 2))
1783 V1 = OriV1;
1784 else if (fitsRegularPattern<int>(Begin, 2, End, Mask.size(), 2))
1785 V1 = OriV2;
1786 else
1787 return SDValue();
1788
1789 if (fitsRegularPattern<int>(Begin + 1, 2, End, 0, 2))
1790 V2 = OriV1;
1791 else if (fitsRegularPattern<int>(Begin + 1, 2, End, Mask.size(), 2))
1792 V2 = OriV2;
1793 else
1794 return SDValue();
1795
1796 return DAG.getNode(LoongArchISD::VPACKEV, DL, VT, V2, V1);
1797}
1798
1799/// Lower VECTOR_SHUFFLE into VPACKOD (if possible).
1800///
1801/// VPACKOD interleaves the odd elements from each vector.
1802///
1803/// It is possible to lower into VPACKOD when the mask consists of two of the
1804/// following forms interleaved:
1805/// <1, 3, 5, ...>
1806/// <n+1, n+3, n+5, ...>
1807/// where n is the number of elements in the vector.
1808/// For example:
1809/// <1, 1, 3, 3, 5, 5, ...>
1810/// <1, n+1, 3, n+3, 5, n+5, ...>
1811///
1812/// When undef's appear in the mask they are treated as if they were whatever
1813/// value is necessary in order to fit the above forms.
1815 MVT VT, SDValue V1, SDValue V2,
1816 SelectionDAG &DAG) {
1817
1818 const auto &Begin = Mask.begin();
1819 const auto &End = Mask.end();
1820 SDValue OriV1 = V1, OriV2 = V2;
1821
1822 if (fitsRegularPattern<int>(Begin, 2, End, 1, 2))
1823 V1 = OriV1;
1824 else if (fitsRegularPattern<int>(Begin, 2, End, Mask.size() + 1, 2))
1825 V1 = OriV2;
1826 else
1827 return SDValue();
1828
1829 if (fitsRegularPattern<int>(Begin + 1, 2, End, 1, 2))
1830 V2 = OriV1;
1831 else if (fitsRegularPattern<int>(Begin + 1, 2, End, Mask.size() + 1, 2))
1832 V2 = OriV2;
1833 else
1834 return SDValue();
1835
1836 return DAG.getNode(LoongArchISD::VPACKOD, DL, VT, V2, V1);
1837}
1838
1839/// Lower VECTOR_SHUFFLE into VILVH (if possible).
1840///
1841/// VILVH interleaves consecutive elements from the left (highest-indexed) half
1842/// of each vector.
1843///
1844/// It is possible to lower into VILVH when the mask consists of two of the
1845/// following forms interleaved:
1846/// <x, x+1, x+2, ...>
1847/// <n+x, n+x+1, n+x+2, ...>
1848/// where n is the number of elements in the vector and x is half n.
1849/// For example:
1850/// <x, x, x+1, x+1, x+2, x+2, ...>
1851/// <x, n+x, x+1, n+x+1, x+2, n+x+2, ...>
1852///
1853/// When undef's appear in the mask they are treated as if they were whatever
1854/// value is necessary in order to fit the above forms.
1856 MVT VT, SDValue V1, SDValue V2,
1857 SelectionDAG &DAG) {
1858
1859 const auto &Begin = Mask.begin();
1860 const auto &End = Mask.end();
1861 unsigned HalfSize = Mask.size() / 2;
1862 SDValue OriV1 = V1, OriV2 = V2;
1863
1864 if (fitsRegularPattern<int>(Begin, 2, End, HalfSize, 1))
1865 V1 = OriV1;
1866 else if (fitsRegularPattern<int>(Begin, 2, End, Mask.size() + HalfSize, 1))
1867 V1 = OriV2;
1868 else
1869 return SDValue();
1870
1871 if (fitsRegularPattern<int>(Begin + 1, 2, End, HalfSize, 1))
1872 V2 = OriV1;
1873 else if (fitsRegularPattern<int>(Begin + 1, 2, End, Mask.size() + HalfSize,
1874 1))
1875 V2 = OriV2;
1876 else
1877 return SDValue();
1878
1879 return DAG.getNode(LoongArchISD::VILVH, DL, VT, V2, V1);
1880}
1881
1882/// Lower VECTOR_SHUFFLE into VILVL (if possible).
1883///
1884/// VILVL interleaves consecutive elements from the right (lowest-indexed) half
1885/// of each vector.
1886///
1887/// It is possible to lower into VILVL when the mask consists of two of the
1888/// following forms interleaved:
1889/// <0, 1, 2, ...>
1890/// <n, n+1, n+2, ...>
1891/// where n is the number of elements in the vector.
1892/// For example:
1893/// <0, 0, 1, 1, 2, 2, ...>
1894/// <0, n, 1, n+1, 2, n+2, ...>
1895///
1896/// When undef's appear in the mask they are treated as if they were whatever
1897/// value is necessary in order to fit the above forms.
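/// For instance, for v4i32 (n = 4) the mask <0, 4, 1, 5> fits and interleaves
/// the low halves of V1 and V2: <V1[0], V2[0], V1[1], V2[1]>.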
1898static SDValue lowerVECTOR_SHUFFLE_VILVL(const SDLoc &DL, ArrayRef<int> Mask,
1899 MVT VT, SDValue V1, SDValue V2,
1900 SelectionDAG &DAG) {
1901
1902 const auto &Begin = Mask.begin();
1903 const auto &End = Mask.end();
1904 SDValue OriV1 = V1, OriV2 = V2;
1905
1906 if (fitsRegularPattern<int>(Begin, 2, End, 0, 1))
1907 V1 = OriV1;
1908 else if (fitsRegularPattern<int>(Begin, 2, End, Mask.size(), 1))
1909 V1 = OriV2;
1910 else
1911 return SDValue();
1912
1913 if (fitsRegularPattern<int>(Begin + 1, 2, End, 0, 1))
1914 V2 = OriV1;
1915 else if (fitsRegularPattern<int>(Begin + 1, 2, End, Mask.size(), 1))
1916 V2 = OriV2;
1917 else
1918 return SDValue();
1919
1920 return DAG.getNode(LoongArchISD::VILVL, DL, VT, V2, V1);
1921}
1922
1923/// Lower VECTOR_SHUFFLE into VPICKEV (if possible).
1924///
1925/// VPICKEV copies the even elements of each vector into the result vector.
1926///
1927/// It is possible to lower into VPICKEV when the mask consists of two of the
1928/// following forms concatenated:
1929/// <0, 2, 4, ...>
1930/// <n, n+2, n+4, ...>
1931/// where n is the number of elements in the vector.
1932/// For example:
1933/// <0, 2, 4, ..., 0, 2, 4, ...>
1934/// <0, 2, 4, ..., n, n+2, n+4, ...>
1935///
1936/// When undef's appear in the mask they are treated as if they were whatever
1937/// value is necessary in order to fit the above forms.
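/// For instance, for v4i32 (n = 4) the mask <0, 2, 4, 6> fits: the first half
/// gathers the even elements of V1 and the second half gathers the even
/// elements of V2, giving <V1[0], V1[2], V2[0], V2[2]>.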
1938static SDValue lowerVECTOR_SHUFFLE_VPICKEV(const SDLoc &DL, ArrayRef<int> Mask,
1939 MVT VT, SDValue V1, SDValue V2,
1940 SelectionDAG &DAG) {
1941
1942 const auto &Begin = Mask.begin();
1943 const auto &Mid = Mask.begin() + Mask.size() / 2;
1944 const auto &End = Mask.end();
1945 SDValue OriV1 = V1, OriV2 = V2;
1946
1947 if (fitsRegularPattern<int>(Begin, 1, Mid, 0, 2))
1948 V1 = OriV1;
1949 else if (fitsRegularPattern<int>(Begin, 1, Mid, Mask.size(), 2))
1950 V1 = OriV2;
1951 else
1952 return SDValue();
1953
1954 if (fitsRegularPattern<int>(Mid, 1, End, 0, 2))
1955 V2 = OriV1;
1956 else if (fitsRegularPattern<int>(Mid, 1, End, Mask.size(), 2))
1957 V2 = OriV2;
1958
1959 else
1960 return SDValue();
1961
1962 return DAG.getNode(LoongArchISD::VPICKEV, DL, VT, V2, V1);
1963}
1964
1965/// Lower VECTOR_SHUFFLE into VPICKOD (if possible).
1966///
1967/// VPICKOD copies the odd elements of each vector into the result vector.
1968///
1969/// It is possible to lower into VPICKOD when the mask consists of two of the
1970/// following forms concatenated:
1971/// <1, 3, 5, ...>
1972/// <n+1, n+3, n+5, ...>
1973/// where n is the number of elements in the vector.
1974/// For example:
1975/// <1, 3, 5, ..., 1, 3, 5, ...>
1976/// <1, 3, 5, ..., n+1, n+3, n+5, ...>
1977///
1978/// When undef's appear in the mask they are treated as if they were whatever
1979/// value is necessary in order to fit the above forms.
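/// For instance, for v4i32 (n = 4) the mask <1, 3, 5, 7> fits, giving
/// <V1[1], V1[3], V2[1], V2[3]>.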
1980static SDValue lowerVECTOR_SHUFFLE_VPICKOD(const SDLoc &DL, ArrayRef<int> Mask,
1981 MVT VT, SDValue V1, SDValue V2,
1982 SelectionDAG &DAG) {
1983
1984 const auto &Begin = Mask.begin();
1985 const auto &Mid = Mask.begin() + Mask.size() / 2;
1986 const auto &End = Mask.end();
1987 SDValue OriV1 = V1, OriV2 = V2;
1988
1989 if (fitsRegularPattern<int>(Begin, 1, Mid, 1, 2))
1990 V1 = OriV1;
1991 else if (fitsRegularPattern<int>(Begin, 1, Mid, Mask.size() + 1, 2))
1992 V1 = OriV2;
1993 else
1994 return SDValue();
1995
1996 if (fitsRegularPattern<int>(Mid, 1, End, 1, 2))
1997 V2 = OriV1;
1998 else if (fitsRegularPattern<int>(Mid, 1, End, Mask.size() + 1, 2))
1999 V2 = OriV2;
2000 else
2001 return SDValue();
2002
2003 return DAG.getNode(LoongArchISD::VPICKOD, DL, VT, V2, V1);
2004}
2005
2006/// Lower VECTOR_SHUFFLE into VSHUF.
2007///
2008/// This mostly consists of converting the shuffle mask into a BUILD_VECTOR and
2009/// adding it as an operand to the resulting VSHUF.
2010static SDValue lowerVECTOR_SHUFFLE_VSHUF(const SDLoc &DL, ArrayRef<int> Mask,
2011 MVT VT, SDValue V1, SDValue V2,
2012 SelectionDAG &DAG,
2013 const LoongArchSubtarget &Subtarget) {
2014
2016 for (auto M : Mask)
2017 Ops.push_back(DAG.getSignedConstant(M, DL, Subtarget.getGRLenVT()));
2018
2019 EVT MaskVecTy = VT.changeVectorElementTypeToInteger();
2020 SDValue MaskVec = DAG.getBuildVector(MaskVecTy, DL, Ops);
2021
2022 // VECTOR_SHUFFLE concatenates the vectors in a vectorwise fashion.
2023 // <0b00, 0b01> + <0b10, 0b11> -> <0b00, 0b01, 0b10, 0b11>
2024 // VSHUF concatenates the vectors in a bitwise fashion:
2025 // <0b00, 0b01> + <0b10, 0b11> ->
2026 // 0b0100 + 0b1110 -> 0b01001110
2027 // <0b10, 0b11, 0b00, 0b01>
2028 // We must therefore swap the operands to get the correct result.
2029 return DAG.getNode(LoongArchISD::VSHUF, DL, VT, MaskVec, V2, V1);
2030}
2031
2032/// Dispatching routine to lower various 128-bit LoongArch vector shuffles.
2033///
2034/// This routine breaks down the specific type of 128-bit shuffle and
2035/// dispatches to the lowering routines accordingly.
2036static SDValue lower128BitShuffle(const SDLoc &DL, ArrayRef<int> Mask, MVT VT,
2037 SDValue V1, SDValue V2, SelectionDAG &DAG,
2038 const LoongArchSubtarget &Subtarget) {
2039 assert((VT.SimpleTy == MVT::v16i8 || VT.SimpleTy == MVT::v8i16 ||
2040 VT.SimpleTy == MVT::v4i32 || VT.SimpleTy == MVT::v2i64 ||
2041 VT.SimpleTy == MVT::v4f32 || VT.SimpleTy == MVT::v2f64) &&
2042 "Vector type is unsupported for lsx!");
2043 assert(V1.getSimpleValueType() == V2.getSimpleValueType() &&
2044 "Two operands have different types!");
2045 assert(VT.getVectorNumElements() == Mask.size() &&
2046 "Unexpected mask size for shuffle!");
2047 assert(Mask.size() % 2 == 0 && "Expected even mask size.");
2048
2049 APInt KnownUndef, KnownZero;
2050 computeZeroableShuffleElements(Mask, V1, V2, KnownUndef, KnownZero);
2051 APInt Zeroable = KnownUndef | KnownZero;
2052
2053 SDValue Result;
2054 // TODO: Add more comparison patterns.
2055 if (V2.isUndef()) {
2056 if ((Result =
2057 lowerVECTOR_SHUFFLE_VREPLVEI(DL, Mask, VT, V1, DAG, Subtarget)))
2058 return Result;
2059 if ((Result =
2060 lowerVECTOR_SHUFFLE_VSHUF4I(DL, Mask, VT, V1, V2, DAG, Subtarget)))
2061 return Result;
2062 if ((Result =
2063 lowerVECTOR_SHUFFLE_IsReverse(DL, Mask, VT, V1, DAG, Subtarget)))
2064 return Result;
2065
2066 // TODO: The commented-out assignment below may be enabled in the future
2067 // to better match the pattern for instruction selection.
2068 /* V2 = V1; */
2069 }
2070
2071 // It is recommended not to change the pattern comparison order for better
2072 // performance.
2073 if ((Result = lowerVECTOR_SHUFFLE_VPACKEV(DL, Mask, VT, V1, V2, DAG)))
2074 return Result;
2075 if ((Result = lowerVECTOR_SHUFFLE_VPACKOD(DL, Mask, VT, V1, V2, DAG)))
2076 return Result;
2077 if ((Result = lowerVECTOR_SHUFFLE_VILVH(DL, Mask, VT, V1, V2, DAG)))
2078 return Result;
2079 if ((Result = lowerVECTOR_SHUFFLE_VILVL(DL, Mask, VT, V1, V2, DAG)))
2080 return Result;
2081 if ((Result = lowerVECTOR_SHUFFLE_VPICKEV(DL, Mask, VT, V1, V2, DAG)))
2082 return Result;
2083 if ((Result = lowerVECTOR_SHUFFLE_VPICKOD(DL, Mask, VT, V1, V2, DAG)))
2084 return Result;
2085 if ((VT.SimpleTy == MVT::v2i64 || VT.SimpleTy == MVT::v2f64) &&
2086 (Result =
2087 lowerVECTOR_SHUFFLE_VSHUF4I(DL, Mask, VT, V1, V2, DAG, Subtarget)))
2088 return Result;
2089 if ((Result = lowerVECTOR_SHUFFLEAsZeroOrAnyExtend(DL, Mask, VT, V1, V2, DAG,
2090 Zeroable)))
2091 return Result;
2092 if ((Result = lowerVECTOR_SHUFFLEAsShift(DL, Mask, VT, V1, V2, DAG, Subtarget,
2093 Zeroable)))
2094 return Result;
2095 if ((Result = lowerVECTOR_SHUFFLEAsByteRotate(DL, Mask, VT, V1, V2, DAG,
2096 Subtarget)))
2097 return Result;
2098 if (SDValue NewShuffle = widenShuffleMask(DL, Mask, VT, V1, V2, DAG))
2099 return NewShuffle;
2100 if ((Result =
2101 lowerVECTOR_SHUFFLE_VSHUF(DL, Mask, VT, V1, V2, DAG, Subtarget)))
2102 return Result;
2103 return SDValue();
2104}
2105
2106/// Lower VECTOR_SHUFFLE into XVREPLVEI (if possible).
2107///
2108/// It is a XVREPLVEI when the mask is:
2109/// <x, x, x, ..., x+n, x+n, x+n, ...>
2110/// where x appears n times and n is half the length of the vector.
2111///
2112/// When undef's appear in the mask they are treated as if they were whatever
2113/// value is necessary in order to fit the above form.
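/// For instance, for v8i32 (n = 4) the mask <2, 2, 2, 2, 6, 6, 6, 6> fits and
/// is lowered to a VREPLVEI node with immediate 2, replicating element 2
/// within each 128-bit half of V1.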
2114static SDValue
2115lowerVECTOR_SHUFFLE_XVREPLVEI(const SDLoc &DL, ArrayRef<int> Mask, MVT VT,
2116 SDValue V1, SelectionDAG &DAG,
2117 const LoongArchSubtarget &Subtarget) {
2118 int SplatIndex = -1;
2119 for (const auto &M : Mask) {
2120 if (M != -1) {
2121 SplatIndex = M;
2122 break;
2123 }
2124 }
2125
2126 if (SplatIndex == -1)
2127 return DAG.getUNDEF(VT);
2128
2129 const auto &Begin = Mask.begin();
2130 const auto &End = Mask.end();
2131 int HalfSize = Mask.size() / 2;
2132
2133 if (SplatIndex >= HalfSize)
2134 return SDValue();
2135
2136 assert(SplatIndex < (int)Mask.size() && "Out of bounds mask index");
2137 if (fitsRegularPattern<int>(Begin, 1, End - HalfSize, SplatIndex, 0) &&
2138 fitsRegularPattern<int>(Begin + HalfSize, 1, End, SplatIndex + HalfSize,
2139 0)) {
2140 return DAG.getNode(LoongArchISD::VREPLVEI, DL, VT, V1,
2141 DAG.getConstant(SplatIndex, DL, Subtarget.getGRLenVT()));
2142 }
2143
2144 return SDValue();
2145}
2146
2147/// Lower VECTOR_SHUFFLE into XVSHUF4I (if possible).
2148static SDValue
2149lowerVECTOR_SHUFFLE_XVSHUF4I(const SDLoc &DL, ArrayRef<int> Mask, MVT VT,
2150 SDValue V1, SDValue V2, SelectionDAG &DAG,
2151 const LoongArchSubtarget &Subtarget) {
2152 // When the size is less than or equal to 4, lower cost instructions may be
2153 // used.
2154 if (Mask.size() <= 4)
2155 return SDValue();
2156 return lowerVECTOR_SHUFFLE_VSHUF4I(DL, Mask, VT, V1, V2, DAG, Subtarget);
2157}
2158
2159/// Lower VECTOR_SHUFFLE into XVPERMI (if possible).
2160static SDValue
2161lowerVECTOR_SHUFFLE_XVPERMI(const SDLoc &DL, ArrayRef<int> Mask, MVT VT,
2162 SDValue V1, SelectionDAG &DAG,
2163 const LoongArchSubtarget &Subtarget) {
2164 // Only consider XVPERMI_D.
2165 if (Mask.size() != 4 || (VT != MVT::v4i64 && VT != MVT::v4f64))
2166 return SDValue();
2167
2168 unsigned MaskImm = 0;
2169 for (unsigned i = 0; i < Mask.size(); ++i) {
2170 if (Mask[i] == -1)
2171 continue;
2172 MaskImm |= Mask[i] << (i * 2);
2173 }
2174
2175 return DAG.getNode(LoongArchISD::XVPERMI, DL, VT, V1,
2176 DAG.getConstant(MaskImm, DL, Subtarget.getGRLenVT()));
2177}
2178
2179/// Lower VECTOR_SHUFFLE into XVPERM (if possible).
2180static SDValue lowerVECTOR_SHUFFLE_XVPERM(const SDLoc &DL, ArrayRef<int> Mask,
2181 MVT VT, SDValue V1, SelectionDAG &DAG,
2182 const LoongArchSubtarget &Subtarget) {
2183 // LoongArch LASX only has XVPERM_W.
2184 if (Mask.size() != 8 || (VT != MVT::v8i32 && VT != MVT::v8f32))
2185 return SDValue();
2186
2187 unsigned NumElts = VT.getVectorNumElements();
2188 unsigned HalfSize = NumElts / 2;
2189 bool FrontLo = true, FrontHi = true;
2190 bool BackLo = true, BackHi = true;
2191
2192 auto inRange = [](int val, int low, int high) {
2193 return (val == -1) || (val >= low && val < high);
2194 };
2195
2196 for (unsigned i = 0; i < HalfSize; ++i) {
2197 int Fronti = Mask[i];
2198 int Backi = Mask[i + HalfSize];
2199
2200 FrontLo &= inRange(Fronti, 0, HalfSize);
2201 FrontHi &= inRange(Fronti, HalfSize, NumElts);
2202 BackLo &= inRange(Backi, 0, HalfSize);
2203 BackHi &= inRange(Backi, HalfSize, NumElts);
2204 }
2205
2206 // If both the lower and upper 128-bit parts access only one half of the
2207 // vector (either lower or upper), avoid using xvperm.w. The latency of
2208 // xvperm.w (3) is higher than that of xvshuf (1) plus xvori (1).
2209 if ((FrontLo || FrontHi) && (BackLo || BackHi))
2210 return SDValue();
2211
2213 MVT GRLenVT = Subtarget.getGRLenVT();
2214 for (unsigned i = 0; i < NumElts; ++i)
2215 Masks.push_back(Mask[i] == -1 ? DAG.getUNDEF(GRLenVT)
2216 : DAG.getConstant(Mask[i], DL, GRLenVT));
2217 SDValue MaskVec = DAG.getBuildVector(MVT::v8i32, DL, Masks);
2218
2219 return DAG.getNode(LoongArchISD::XVPERM, DL, VT, V1, MaskVec);
2220}
2221
2222/// Lower VECTOR_SHUFFLE into XVPACKEV (if possible).
2223static SDValue lowerVECTOR_SHUFFLE_XVPACKEV(const SDLoc &DL, ArrayRef<int> Mask,
2224 MVT VT, SDValue V1, SDValue V2,
2225 SelectionDAG &DAG) {
2226 return lowerVECTOR_SHUFFLE_VPACKEV(DL, Mask, VT, V1, V2, DAG);
2227}
2228
2229/// Lower VECTOR_SHUFFLE into XVPACKOD (if possible).
2230static SDValue lowerVECTOR_SHUFFLE_XVPACKOD(const SDLoc &DL, ArrayRef<int> Mask,
2231 MVT VT, SDValue V1, SDValue V2,
2232 SelectionDAG &DAG) {
2233 return lowerVECTOR_SHUFFLE_VPACKOD(DL, Mask, VT, V1, V2, DAG);
2234}
2235
2236/// Lower VECTOR_SHUFFLE into XVILVH (if possible).
2237static SDValue lowerVECTOR_SHUFFLE_XVILVH(const SDLoc &DL, ArrayRef<int> Mask,
2238 MVT VT, SDValue V1, SDValue V2,
2239 SelectionDAG &DAG) {
2240
2241 const auto &Begin = Mask.begin();
2242 const auto &End = Mask.end();
2243 unsigned HalfSize = Mask.size() / 2;
2244 unsigned LeftSize = HalfSize / 2;
2245 SDValue OriV1 = V1, OriV2 = V2;
2246
2247 if (fitsRegularPattern<int>(Begin, 2, End - HalfSize, HalfSize - LeftSize,
2248 1) &&
2249 fitsRegularPattern<int>(Begin + HalfSize, 2, End, HalfSize + LeftSize, 1))
2250 V1 = OriV1;
2251 else if (fitsRegularPattern<int>(Begin, 2, End - HalfSize,
2252 Mask.size() + HalfSize - LeftSize, 1) &&
2253 fitsRegularPattern<int>(Begin + HalfSize, 2, End,
2254 Mask.size() + HalfSize + LeftSize, 1))
2255 V1 = OriV2;
2256 else
2257 return SDValue();
2258
2259 if (fitsRegularPattern<int>(Begin + 1, 2, End - HalfSize, HalfSize - LeftSize,
2260 1) &&
2261 fitsRegularPattern<int>(Begin + 1 + HalfSize, 2, End, HalfSize + LeftSize,
2262 1))
2263 V2 = OriV1;
2264 else if (fitsRegularPattern<int>(Begin + 1, 2, End - HalfSize,
2265 Mask.size() + HalfSize - LeftSize, 1) &&
2266 fitsRegularPattern<int>(Begin + 1 + HalfSize, 2, End,
2267 Mask.size() + HalfSize + LeftSize, 1))
2268 V2 = OriV2;
2269 else
2270 return SDValue();
2271
2272 return DAG.getNode(LoongArchISD::VILVH, DL, VT, V2, V1);
2273}
2274
2275/// Lower VECTOR_SHUFFLE into XVILVL (if possible).
2276static SDValue lowerVECTOR_SHUFFLE_XVILVL(const SDLoc &DL, ArrayRef<int> Mask,
2277 MVT VT, SDValue V1, SDValue V2,
2278 SelectionDAG &DAG) {
2279
2280 const auto &Begin = Mask.begin();
2281 const auto &End = Mask.end();
2282 unsigned HalfSize = Mask.size() / 2;
2283 SDValue OriV1 = V1, OriV2 = V2;
2284
2285 if (fitsRegularPattern<int>(Begin, 2, End - HalfSize, 0, 1) &&
2286 fitsRegularPattern<int>(Begin + HalfSize, 2, End, HalfSize, 1))
2287 V1 = OriV1;
2288 else if (fitsRegularPattern<int>(Begin, 2, End - HalfSize, Mask.size(), 1) &&
2289 fitsRegularPattern<int>(Begin + HalfSize, 2, End,
2290 Mask.size() + HalfSize, 1))
2291 V1 = OriV2;
2292 else
2293 return SDValue();
2294
2295 if (fitsRegularPattern<int>(Begin + 1, 2, End - HalfSize, 0, 1) &&
2296 fitsRegularPattern<int>(Begin + 1 + HalfSize, 2, End, HalfSize, 1))
2297 V2 = OriV1;
2298 else if (fitsRegularPattern<int>(Begin + 1, 2, End - HalfSize, Mask.size(),
2299 1) &&
2300 fitsRegularPattern<int>(Begin + 1 + HalfSize, 2, End,
2301 Mask.size() + HalfSize, 1))
2302 V2 = OriV2;
2303 else
2304 return SDValue();
2305
2306 return DAG.getNode(LoongArchISD::VILVL, DL, VT, V2, V1);
2307}
2308
2309/// Lower VECTOR_SHUFFLE into XVPICKEV (if possible).
2310static SDValue lowerVECTOR_SHUFFLE_XVPICKEV(const SDLoc &DL, ArrayRef<int> Mask,
2311 MVT VT, SDValue V1, SDValue V2,
2312 SelectionDAG &DAG) {
2313
2314 const auto &Begin = Mask.begin();
2315 const auto &LeftMid = Mask.begin() + Mask.size() / 4;
2316 const auto &Mid = Mask.begin() + Mask.size() / 2;
2317 const auto &RightMid = Mask.end() - Mask.size() / 4;
2318 const auto &End = Mask.end();
2319 unsigned HalfSize = Mask.size() / 2;
2320 SDValue OriV1 = V1, OriV2 = V2;
2321
2322 if (fitsRegularPattern<int>(Begin, 1, LeftMid, 0, 2) &&
2323 fitsRegularPattern<int>(Mid, 1, RightMid, HalfSize, 2))
2324 V1 = OriV1;
2325 else if (fitsRegularPattern<int>(Begin, 1, LeftMid, Mask.size(), 2) &&
2326 fitsRegularPattern<int>(Mid, 1, RightMid, Mask.size() + HalfSize, 2))
2327 V1 = OriV2;
2328 else
2329 return SDValue();
2330
2331 if (fitsRegularPattern<int>(LeftMid, 1, Mid, 0, 2) &&
2332 fitsRegularPattern<int>(RightMid, 1, End, HalfSize, 2))
2333 V2 = OriV1;
2334 else if (fitsRegularPattern<int>(LeftMid, 1, Mid, Mask.size(), 2) &&
2335 fitsRegularPattern<int>(RightMid, 1, End, Mask.size() + HalfSize, 2))
2336 V2 = OriV2;
2337
2338 else
2339 return SDValue();
2340
2341 return DAG.getNode(LoongArchISD::VPICKEV, DL, VT, V2, V1);
2342}
2343
2344/// Lower VECTOR_SHUFFLE into XVPICKOD (if possible).
2345static SDValue lowerVECTOR_SHUFFLE_XVPICKOD(const SDLoc &DL, ArrayRef<int> Mask,
2346 MVT VT, SDValue V1, SDValue V2,
2347 SelectionDAG &DAG) {
2348
2349 const auto &Begin = Mask.begin();
2350 const auto &LeftMid = Mask.begin() + Mask.size() / 4;
2351 const auto &Mid = Mask.begin() + Mask.size() / 2;
2352 const auto &RightMid = Mask.end() - Mask.size() / 4;
2353 const auto &End = Mask.end();
2354 unsigned HalfSize = Mask.size() / 2;
2355 SDValue OriV1 = V1, OriV2 = V2;
2356
2357 if (fitsRegularPattern<int>(Begin, 1, LeftMid, 1, 2) &&
2358 fitsRegularPattern<int>(Mid, 1, RightMid, HalfSize + 1, 2))
2359 V1 = OriV1;
2360 else if (fitsRegularPattern<int>(Begin, 1, LeftMid, Mask.size() + 1, 2) &&
2361 fitsRegularPattern<int>(Mid, 1, RightMid, Mask.size() + HalfSize + 1,
2362 2))
2363 V1 = OriV2;
2364 else
2365 return SDValue();
2366
2367 if (fitsRegularPattern<int>(LeftMid, 1, Mid, 1, 2) &&
2368 fitsRegularPattern<int>(RightMid, 1, End, HalfSize + 1, 2))
2369 V2 = OriV1;
2370 else if (fitsRegularPattern<int>(LeftMid, 1, Mid, Mask.size() + 1, 2) &&
2371 fitsRegularPattern<int>(RightMid, 1, End, Mask.size() + HalfSize + 1,
2372 2))
2373 V2 = OriV2;
2374 else
2375 return SDValue();
2376
2377 return DAG.getNode(LoongArchISD::VPICKOD, DL, VT, V2, V1);
2378}
2379
2380/// Lower VECTOR_SHUFFLE into XVINSVE0 (if possible).
2381static SDValue
2382lowerVECTOR_SHUFFLE_XVINSVE0(const SDLoc &DL, ArrayRef<int> Mask, MVT VT,
2383 SDValue V1, SDValue V2, SelectionDAG &DAG,
2384 const LoongArchSubtarget &Subtarget) {
2385 // LoongArch LASX only supports xvinsve0.{w/d}.
2386 if (VT != MVT::v8i32 && VT != MVT::v8f32 && VT != MVT::v4i64 &&
2387 VT != MVT::v4f64)
2388 return SDValue();
2389
2390 MVT GRLenVT = Subtarget.getGRLenVT();
2391 int MaskSize = Mask.size();
2392 assert(MaskSize == (int)VT.getVectorNumElements() && "Unexpected mask size");
2393
2394 // Check if exactly one element of the Mask is replaced by 'Replaced', while
2395 // all other elements are either 'Base + i' or undef (-1). On success, return
2396 // the index of the replaced element. Otherwise, just return -1.
2397 auto checkReplaceOne = [&](int Base, int Replaced) -> int {
2398 int Idx = -1;
2399 for (int i = 0; i < MaskSize; ++i) {
2400 if (Mask[i] == Base + i || Mask[i] == -1)
2401 continue;
2402 if (Mask[i] != Replaced)
2403 return -1;
2404 if (Idx == -1)
2405 Idx = i;
2406 else
2407 return -1;
2408 }
2409 return Idx;
2410 };
2411
2412 // Case 1: the lowest element of V2 replaces one element in V1.
2413 int Idx = checkReplaceOne(0, MaskSize);
2414 if (Idx != -1)
2415 return DAG.getNode(LoongArchISD::XVINSVE0, DL, VT, V1, V2,
2416 DAG.getConstant(Idx, DL, GRLenVT));
2417
2418 // Case 2: the lowest element of V1 replaces one element in V2.
2419 Idx = checkReplaceOne(MaskSize, 0);
2420 if (Idx != -1)
2421 return DAG.getNode(LoongArchISD::XVINSVE0, DL, VT, V2, V1,
2422 DAG.getConstant(Idx, DL, GRLenVT));
2423
2424 return SDValue();
2425}
2426
2427/// Lower VECTOR_SHUFFLE into XVSHUF (if possible).
2428static SDValue lowerVECTOR_SHUFFLE_XVSHUF(const SDLoc &DL, ArrayRef<int> Mask,
2429 MVT VT, SDValue V1, SDValue V2,
2430 SelectionDAG &DAG) {
2431
2432 int MaskSize = Mask.size();
2433 int HalfSize = Mask.size() / 2;
2434 const auto &Begin = Mask.begin();
2435 const auto &Mid = Mask.begin() + HalfSize;
2436 const auto &End = Mask.end();
2437
2438 // VECTOR_SHUFFLE concatenates the vectors:
2439 // <0, 1, 2, 3, 4, 5, 6, 7> + <8, 9, 10, 11, 12, 13, 14, 15>
2440 // shuffling ->
2441 // <0, 1, 2, 3, 8, 9, 10, 11> <4, 5, 6, 7, 12, 13, 14, 15>
2442 //
2443 // XVSHUF concatenates the vectors:
2444 // <a0, a1, a2, a3, b0, b1, b2, b3> + <a4, a5, a6, a7, b4, b5, b6, b7>
2445 // shuffling ->
2446 // <a0, a1, a2, a3, a4, a5, a6, a7> + <b0, b1, b2, b3, b4, b5, b6, b7>
2447 SmallVector<SDValue, 8> MaskAlloc;
2448 for (auto it = Begin; it < Mid; it++) {
2449 if (*it < 0) // UNDEF
2450 MaskAlloc.push_back(DAG.getTargetConstant(0, DL, MVT::i64));
2451 else if ((*it >= 0 && *it < HalfSize) ||
2452 (*it >= MaskSize && *it < MaskSize + HalfSize)) {
2453 int M = *it < HalfSize ? *it : *it - HalfSize;
2454 MaskAlloc.push_back(DAG.getTargetConstant(M, DL, MVT::i64));
2455 } else
2456 return SDValue();
2457 }
2458 assert((int)MaskAlloc.size() == HalfSize && "xvshuf convert failed!");
2459
2460 for (auto it = Mid; it < End; it++) {
2461 if (*it < 0) // UNDEF
2462 MaskAlloc.push_back(DAG.getTargetConstant(0, DL, MVT::i64));
2463 else if ((*it >= HalfSize && *it < MaskSize) ||
2464 (*it >= MaskSize + HalfSize && *it < MaskSize * 2)) {
2465 int M = *it < MaskSize ? *it - HalfSize : *it - MaskSize;
2466 MaskAlloc.push_back(DAG.getTargetConstant(M, DL, MVT::i64));
2467 } else
2468 return SDValue();
2469 }
2470 assert((int)MaskAlloc.size() == MaskSize && "xvshuf convert failed!");
2471
2472 EVT MaskVecTy = VT.changeVectorElementTypeToInteger();
2473 SDValue MaskVec = DAG.getBuildVector(MaskVecTy, DL, MaskAlloc);
2474 return DAG.getNode(LoongArchISD::VSHUF, DL, VT, MaskVec, V2, V1);
2475}
2476
2477/// Shuffle vectors by lane to generate more optimized instructions.
2478/// 256-bit shuffles are always considered as 2-lane 128-bit shuffles.
2479///
2480/// Therefore, except for the following four cases, other cases are regarded
2481/// as cross-lane shuffles, where optimization is relatively limited.
2482///
2483/// - Shuffle high, low lanes of the two input vectors
2484/// <0, 1, 2, 3> + <4, 5, 6, 7> --- <0, 5, 3, 6>
2485/// - Shuffle low, high lanes of the two input vectors
2486/// <0, 1, 2, 3> + <4, 5, 6, 7> --- <3, 6, 0, 5>
2487/// - Shuffle low, low lanes of the two input vectors
2488/// <0, 1, 2, 3> + <4, 5, 6, 7> --- <3, 6, 3, 6>
2489/// - Shuffle high, high lanes of the two input vectors
2490/// <0, 1, 2, 3> + <4, 5, 6, 7> --- <0, 5, 0, 5>
2491///
2492/// The first case is the closest to LoongArch instructions and the other
2493/// cases need to be converted to it for processing.
2494///
2495/// This function will return true for the last three cases above and will
2496/// modify V1, V2 and Mask. Otherwise, return false for the first case and
2497/// cross-lane shuffle cases.
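/// For instance, for v8i32 the mask <4, 12, 6, 14, 0, 8, 2, 10> is a "low,
/// high" shuffle: both 128-bit halves of V1 and V2 are swapped (XVPERMI with
/// immediate 0b01001110) and the mask is rewritten to
/// <0, 8, 2, 10, 4, 12, 6, 14>, which matches the first case above.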
2498static bool canonicalizeShuffleVectorByLane(
2499 const SDLoc &DL, MutableArrayRef<int> Mask, MVT VT, SDValue &V1,
2500 SDValue &V2, SelectionDAG &DAG, const LoongArchSubtarget &Subtarget) {
2501
2502 enum HalfMaskType { HighLaneTy, LowLaneTy, None };
2503
2504 int MaskSize = Mask.size();
2505 int HalfSize = Mask.size() / 2;
2506 MVT GRLenVT = Subtarget.getGRLenVT();
2507
2508 HalfMaskType preMask = None, postMask = None;
2509
2510 if (std::all_of(Mask.begin(), Mask.begin() + HalfSize, [&](int M) {
2511 return M < 0 || (M >= 0 && M < HalfSize) ||
2512 (M >= MaskSize && M < MaskSize + HalfSize);
2513 }))
2514 preMask = HighLaneTy;
2515 else if (std::all_of(Mask.begin(), Mask.begin() + HalfSize, [&](int M) {
2516 return M < 0 || (M >= HalfSize && M < MaskSize) ||
2517 (M >= MaskSize + HalfSize && M < MaskSize * 2);
2518 }))
2519 preMask = LowLaneTy;
2520
2521 if (std::all_of(Mask.begin() + HalfSize, Mask.end(), [&](int M) {
2522 return M < 0 || (M >= HalfSize && M < MaskSize) ||
2523 (M >= MaskSize + HalfSize && M < MaskSize * 2);
2524 }))
2525 postMask = LowLaneTy;
2526 else if (std::all_of(Mask.begin() + HalfSize, Mask.end(), [&](int M) {
2527 return M < 0 || (M >= 0 && M < HalfSize) ||
2528 (M >= MaskSize && M < MaskSize + HalfSize);
2529 }))
2530 postMask = HighLaneTy;
2531
2532 // The pre-half of mask is high lane type, and the post-half of mask
2533 // is low lane type, which is closest to the LoongArch instructions.
2534 //
2535 // Note: In the LoongArch architecture, the high lane of the mask corresponds
2536 // to the lower 128 bits of the vector register, and the low lane of the mask
2537 // corresponds to the higher 128 bits of the vector register.
2538 if (preMask == HighLaneTy && postMask == LowLaneTy) {
2539 return false;
2540 }
2541 if (preMask == LowLaneTy && postMask == HighLaneTy) {
2542 V1 = DAG.getBitcast(MVT::v4i64, V1);
2543 V1 = DAG.getNode(LoongArchISD::XVPERMI, DL, MVT::v4i64, V1,
2544 DAG.getConstant(0b01001110, DL, GRLenVT));
2545 V1 = DAG.getBitcast(VT, V1);
2546
2547 if (!V2.isUndef()) {
2548 V2 = DAG.getBitcast(MVT::v4i64, V2);
2549 V2 = DAG.getNode(LoongArchISD::XVPERMI, DL, MVT::v4i64, V2,
2550 DAG.getConstant(0b01001110, DL, GRLenVT));
2551 V2 = DAG.getBitcast(VT, V2);
2552 }
2553
2554 for (auto it = Mask.begin(); it < Mask.begin() + HalfSize; it++) {
2555 *it = *it < 0 ? *it : *it - HalfSize;
2556 }
2557 for (auto it = Mask.begin() + HalfSize; it < Mask.end(); it++) {
2558 *it = *it < 0 ? *it : *it + HalfSize;
2559 }
2560 } else if (preMask == LowLaneTy && postMask == LowLaneTy) {
2561 V1 = DAG.getBitcast(MVT::v4i64, V1);
2562 V1 = DAG.getNode(LoongArchISD::XVPERMI, DL, MVT::v4i64, V1,
2563 DAG.getConstant(0b11101110, DL, GRLenVT));
2564 V1 = DAG.getBitcast(VT, V1);
2565
2566 if (!V2.isUndef()) {
2567 V2 = DAG.getBitcast(MVT::v4i64, V2);
2568 V2 = DAG.getNode(LoongArchISD::XVPERMI, DL, MVT::v4i64, V2,
2569 DAG.getConstant(0b11101110, DL, GRLenVT));
2570 V2 = DAG.getBitcast(VT, V2);
2571 }
2572
2573 for (auto it = Mask.begin(); it < Mask.begin() + HalfSize; it++) {
2574 *it = *it < 0 ? *it : *it - HalfSize;
2575 }
2576 } else if (preMask == HighLaneTy && postMask == HighLaneTy) {
2577 V1 = DAG.getBitcast(MVT::v4i64, V1);
2578 V1 = DAG.getNode(LoongArchISD::XVPERMI, DL, MVT::v4i64, V1,
2579 DAG.getConstant(0b01000100, DL, GRLenVT));
2580 V1 = DAG.getBitcast(VT, V1);
2581
2582 if (!V2.isUndef()) {
2583 V2 = DAG.getBitcast(MVT::v4i64, V2);
2584 V2 = DAG.getNode(LoongArchISD::XVPERMI, DL, MVT::v4i64, V2,
2585 DAG.getConstant(0b01000100, DL, GRLenVT));
2586 V2 = DAG.getBitcast(VT, V2);
2587 }
2588
2589 for (auto it = Mask.begin() + HalfSize; it < Mask.end(); it++) {
2590 *it = *it < 0 ? *it : *it + HalfSize;
2591 }
2592 } else { // cross-lane
2593 return false;
2594 }
2595
2596 return true;
2597}
2598
2599/// Lower VECTOR_SHUFFLE as lane permute and then shuffle (if possible).
2600/// Only for 256-bit vector.
2601///
2602/// For example:
2603/// %2 = shufflevector <4 x i64> %0, <4 x i64> poison,
2604/// <4 x i32> <i32 0, i32 3, i32 2, i32 0>
2605/// is lowered to:
2606/// (XVPERMI $xr2, $xr0, 78)
2607/// (XVSHUF $xr1, $xr2, $xr0)
2608/// (XVORI $xr0, $xr1, 0)
2609static SDValue lowerVECTOR_SHUFFLEAsLanePermuteAndShuffle(const SDLoc &DL,
2610 ArrayRef<int> Mask,
2611 MVT VT, SDValue V1,
2612 SDValue V2,
2613 SelectionDAG &DAG) {
2614 assert(VT.is256BitVector() && "Only for 256-bit vector shuffles!");
2615 int Size = Mask.size();
2616 int LaneSize = Size / 2;
2617
2618 bool LaneCrossing[2] = {false, false};
2619 for (int i = 0; i < Size; ++i)
2620 if (Mask[i] >= 0 && ((Mask[i] % Size) / LaneSize) != (i / LaneSize))
2621 LaneCrossing[(Mask[i] % Size) / LaneSize] = true;
2622
2623 // Ensure that all lanes are involved.
2624 if (!LaneCrossing[0] && !LaneCrossing[1])
2625 return SDValue();
2626
2627 SmallVector<int> InLaneMask;
2628 InLaneMask.assign(Mask.begin(), Mask.end());
2629 for (int i = 0; i < Size; ++i) {
2630 int &M = InLaneMask[i];
2631 if (M < 0)
2632 continue;
2633 if (((M % Size) / LaneSize) != (i / LaneSize))
2634 M = (M % LaneSize) + ((i / LaneSize) * LaneSize) + Size;
2635 }
2636
2637 SDValue Flipped = DAG.getBitcast(MVT::v4i64, V1);
2638 Flipped = DAG.getVectorShuffle(MVT::v4i64, DL, Flipped,
2639 DAG.getUNDEF(MVT::v4i64), {2, 3, 0, 1});
2640 Flipped = DAG.getBitcast(VT, Flipped);
2641 return DAG.getVectorShuffle(VT, DL, V1, Flipped, InLaneMask);
2642}
2643
2644/// Dispatching routine to lower various 256-bit LoongArch vector shuffles.
2645///
2646/// This routine breaks down the specific type of 256-bit shuffle and
2647/// dispatches to the lowering routines accordingly.
2648static SDValue lower256BitShuffle(const SDLoc &DL, ArrayRef<int> Mask, MVT VT,
2649 SDValue V1, SDValue V2, SelectionDAG &DAG,
2650 const LoongArchSubtarget &Subtarget) {
2651 assert((VT.SimpleTy == MVT::v32i8 || VT.SimpleTy == MVT::v16i16 ||
2652 VT.SimpleTy == MVT::v8i32 || VT.SimpleTy == MVT::v4i64 ||
2653 VT.SimpleTy == MVT::v8f32 || VT.SimpleTy == MVT::v4f64) &&
2654 "Vector type is unsupported for lasx!");
2655 assert(V1.getSimpleValueType() == V2.getSimpleValueType() &&
2656 "Two operands have different types!");
2657 assert(VT.getVectorNumElements() == Mask.size() &&
2658 "Unexpected mask size for shuffle!");
2659 assert(Mask.size() % 2 == 0 && "Expected even mask size.");
2660 assert(Mask.size() >= 4 && "Mask size is less than 4.");
2661
2662 APInt KnownUndef, KnownZero;
2663 computeZeroableShuffleElements(Mask, V1, V2, KnownUndef, KnownZero);
2664 APInt Zeroable = KnownUndef | KnownZero;
2665
2666 SDValue Result;
2667 // TODO: Add more comparison patterns.
2668 if (V2.isUndef()) {
2669 if ((Result =
2670 lowerVECTOR_SHUFFLE_XVREPLVEI(DL, Mask, VT, V1, DAG, Subtarget)))
2671 return Result;
2672 if ((Result = lowerVECTOR_SHUFFLE_XVSHUF4I(DL, Mask, VT, V1, V2, DAG,
2673 Subtarget)))
2674 return Result;
2675 // Try to widen vectors to gain more optimization opportunities.
2676 if (SDValue NewShuffle = widenShuffleMask(DL, Mask, VT, V1, V2, DAG))
2677 return NewShuffle;
2678 if ((Result =
2679 lowerVECTOR_SHUFFLE_XVPERMI(DL, Mask, VT, V1, DAG, Subtarget)))
2680 return Result;
2681 if ((Result = lowerVECTOR_SHUFFLE_XVPERM(DL, Mask, VT, V1, DAG, Subtarget)))
2682 return Result;
2683 if ((Result =
2684 lowerVECTOR_SHUFFLE_IsReverse(DL, Mask, VT, V1, DAG, Subtarget)))
2685 return Result;
2686
2687 // TODO: The commented-out assignment below may be enabled in the future
2688 // to better match the pattern for instruction selection.
2689 /* V2 = V1; */
2690 }
2691
2692 // It is recommended not to change the pattern comparison order for better
2693 // performance.
2694 if ((Result = lowerVECTOR_SHUFFLE_XVPACKEV(DL, Mask, VT, V1, V2, DAG)))
2695 return Result;
2696 if ((Result = lowerVECTOR_SHUFFLE_XVPACKOD(DL, Mask, VT, V1, V2, DAG)))
2697 return Result;
2698 if ((Result = lowerVECTOR_SHUFFLE_XVILVH(DL, Mask, VT, V1, V2, DAG)))
2699 return Result;
2700 if ((Result = lowerVECTOR_SHUFFLE_XVILVL(DL, Mask, VT, V1, V2, DAG)))
2701 return Result;
2702 if ((Result = lowerVECTOR_SHUFFLE_XVPICKEV(DL, Mask, VT, V1, V2, DAG)))
2703 return Result;
2704 if ((Result = lowerVECTOR_SHUFFLE_XVPICKOD(DL, Mask, VT, V1, V2, DAG)))
2705 return Result;
2706 if ((Result = lowerVECTOR_SHUFFLEAsShift(DL, Mask, VT, V1, V2, DAG, Subtarget,
2707 Zeroable)))
2708 return Result;
2709 if ((Result =
2710 lowerVECTOR_SHUFFLE_XVINSVE0(DL, Mask, VT, V1, V2, DAG, Subtarget)))
2711 return Result;
2712 if ((Result = lowerVECTOR_SHUFFLEAsByteRotate(DL, Mask, VT, V1, V2, DAG,
2713 Subtarget)))
2714 return Result;
2715
2716 // Canonicalize non-cross-lane shuffle vectors.
2717 SmallVector<int> NewMask(Mask);
2718 if (canonicalizeShuffleVectorByLane(DL, NewMask, VT, V1, V2, DAG, Subtarget))
2719 return lower256BitShuffle(DL, NewMask, VT, V1, V2, DAG, Subtarget);
2720
2721 // FIXME: Handling the remaining cases earlier can degrade performance
2722 // in some situations. Further analysis is required to enable more
2723 // effective optimizations.
2724 if (V2.isUndef()) {
2725 if ((Result = lowerVECTOR_SHUFFLEAsLanePermuteAndShuffle(DL, NewMask, VT,
2726 V1, V2, DAG)))
2727 return Result;
2728 }
2729
2730 if (SDValue NewShuffle = widenShuffleMask(DL, NewMask, VT, V1, V2, DAG))
2731 return NewShuffle;
2732 if ((Result = lowerVECTOR_SHUFFLE_XVSHUF(DL, NewMask, VT, V1, V2, DAG)))
2733 return Result;
2734
2735 return SDValue();
2736}
2737
2738SDValue LoongArchTargetLowering::lowerVECTOR_SHUFFLE(SDValue Op,
2739 SelectionDAG &DAG) const {
2740 ShuffleVectorSDNode *SVOp = cast<ShuffleVectorSDNode>(Op);
2741 ArrayRef<int> OrigMask = SVOp->getMask();
2742 SDValue V1 = Op.getOperand(0);
2743 SDValue V2 = Op.getOperand(1);
2744 MVT VT = Op.getSimpleValueType();
2745 int NumElements = VT.getVectorNumElements();
2746 SDLoc DL(Op);
2747
2748 bool V1IsUndef = V1.isUndef();
2749 bool V2IsUndef = V2.isUndef();
2750 if (V1IsUndef && V2IsUndef)
2751 return DAG.getUNDEF(VT);
2752
2753 // When we create a shuffle node we put the UNDEF node to second operand,
2754 // but in some cases the first operand may be transformed to UNDEF.
2755 // In this case we should just commute the node.
2756 if (V1IsUndef)
2757 return DAG.getCommutedVectorShuffle(*SVOp);
2758
2759 // Check for non-undef masks pointing at an undef vector and make the masks
2760 // undef as well. This makes it easier to match the shuffle based solely on
2761 // the mask.
2762 if (V2IsUndef &&
2763 any_of(OrigMask, [NumElements](int M) { return M >= NumElements; })) {
2764 SmallVector<int, 8> NewMask(OrigMask);
2765 for (int &M : NewMask)
2766 if (M >= NumElements)
2767 M = -1;
2768 return DAG.getVectorShuffle(VT, DL, V1, V2, NewMask);
2769 }
2770
2771 // Check for illegal shuffle mask element index values.
2772 int MaskUpperLimit = OrigMask.size() * (V2IsUndef ? 1 : 2);
2773 (void)MaskUpperLimit;
2774 assert(llvm::all_of(OrigMask,
2775 [&](int M) { return -1 <= M && M < MaskUpperLimit; }) &&
2776 "Out of bounds shuffle index");
2777
2778 // For each vector width, delegate to a specialized lowering routine.
2779 if (VT.is128BitVector())
2780 return lower128BitShuffle(DL, OrigMask, VT, V1, V2, DAG, Subtarget);
2781
2782 if (VT.is256BitVector())
2783 return lower256BitShuffle(DL, OrigMask, VT, V1, V2, DAG, Subtarget);
2784
2785 return SDValue();
2786}
2787
2788SDValue LoongArchTargetLowering::lowerFP_TO_FP16(SDValue Op,
2789 SelectionDAG &DAG) const {
2790 // Custom lower to ensure the libcall return is passed in an FPR on hard
2791 // float ABIs.
2792 SDLoc DL(Op);
2793 MakeLibCallOptions CallOptions;
2794 SDValue Op0 = Op.getOperand(0);
2795 SDValue Chain = SDValue();
2796 RTLIB::Libcall LC = RTLIB::getFPROUND(Op0.getValueType(), MVT::f16);
2797 SDValue Res;
2798 std::tie(Res, Chain) =
2799 makeLibCall(DAG, LC, MVT::f32, Op0, CallOptions, DL, Chain);
2800 if (Subtarget.is64Bit())
2801 return DAG.getNode(LoongArchISD::MOVFR2GR_S_LA64, DL, MVT::i64, Res);
2802 return DAG.getBitcast(MVT::i32, Res);
2803}
2804
2805SDValue LoongArchTargetLowering::lowerFP16_TO_FP(SDValue Op,
2806 SelectionDAG &DAG) const {
2807 // Custom lower to ensure the libcall argument is passed in an FPR on hard
2808 // float ABIs.
2809 SDLoc DL(Op);
2810 MakeLibCallOptions CallOptions;
2811 SDValue Op0 = Op.getOperand(0);
2812 SDValue Chain = SDValue();
2813 SDValue Arg = Subtarget.is64Bit() ? DAG.getNode(LoongArchISD::MOVGR2FR_W_LA64,
2814 DL, MVT::f32, Op0)
2815 : DAG.getBitcast(MVT::f32, Op0);
2816 SDValue Res;
2817 std::tie(Res, Chain) = makeLibCall(DAG, RTLIB::FPEXT_F16_F32, MVT::f32, Arg,
2818 CallOptions, DL, Chain);
2819 return Res;
2820}
2821
2822SDValue LoongArchTargetLowering::lowerFP_TO_BF16(SDValue Op,
2823 SelectionDAG &DAG) const {
2824 assert(Subtarget.hasBasicF() && "Unexpected custom legalization");
2825 SDLoc DL(Op);
2826 MakeLibCallOptions CallOptions;
2827 RTLIB::Libcall LC =
2828 RTLIB::getFPROUND(Op.getOperand(0).getValueType(), MVT::bf16);
2829 SDValue Res =
2830 makeLibCall(DAG, LC, MVT::f32, Op.getOperand(0), CallOptions, DL).first;
2831 if (Subtarget.is64Bit())
2832 return DAG.getNode(LoongArchISD::MOVFR2GR_S_LA64, DL, MVT::i64, Res);
2833 return DAG.getBitcast(MVT::i32, Res);
2834}
2835
2836SDValue LoongArchTargetLowering::lowerBF16_TO_FP(SDValue Op,
2837 SelectionDAG &DAG) const {
2838 assert(Subtarget.hasBasicF() && "Unexpected custom legalization");
2839 MVT VT = Op.getSimpleValueType();
2840 SDLoc DL(Op);
2841 Op = DAG.getNode(
2842 ISD::SHL, DL, Op.getOperand(0).getValueType(), Op.getOperand(0),
2843 DAG.getShiftAmountConstant(16, Op.getOperand(0).getValueType(), DL));
2844 SDValue Res = Subtarget.is64Bit() ? DAG.getNode(LoongArchISD::MOVGR2FR_W_LA64,
2845 DL, MVT::f32, Op)
2846 : DAG.getBitcast(MVT::f32, Op);
2847 if (VT != MVT::f32)
2848 return DAG.getNode(ISD::FP_EXTEND, DL, VT, Res);
2849 return Res;
2850}
2851
2852// Lower BUILD_VECTOR as broadcast load (if possible).
2853// For example:
2854// %a = load i8, ptr %ptr
2855// %b = build_vector %a, %a, %a, %a
2856// is lowered to:
2857// (VLDREPL_B $a0, 0)
2858static SDValue lowerBUILD_VECTORAsBroadCastLoad(BuildVectorSDNode *BVOp,
2859 const SDLoc &DL,
2860 SelectionDAG &DAG) {
2861 MVT VT = BVOp->getSimpleValueType(0);
2862 int NumOps = BVOp->getNumOperands();
2863
2864 assert((VT.is128BitVector() || VT.is256BitVector()) &&
2865 "Unsupported vector type for broadcast.");
2866
2867 SDValue IdentitySrc;
2868 bool IsIdeneity = true;
2869
2870 for (int i = 0; i != NumOps; i++) {
2871 SDValue Op = BVOp->getOperand(i);
2872 if (Op.getOpcode() != ISD::LOAD || (IdentitySrc && Op != IdentitySrc)) {
2873 IsIdeneity = false;
2874 break;
2875 }
2876 IdentitySrc = BVOp->getOperand(0);
2877 }
2878
2879 // make sure that this load is valid and only has one user.
2880 if (!IsIdeneity || !IdentitySrc || !BVOp->isOnlyUserOf(IdentitySrc.getNode()))
2881 return SDValue();
2882
2883 auto *LN = cast<LoadSDNode>(IdentitySrc);
2884 auto ExtType = LN->getExtensionType();
2885
2886 if ((ExtType == ISD::EXTLOAD || ExtType == ISD::NON_EXTLOAD) &&
2887 VT.getScalarSizeInBits() == LN->getMemoryVT().getScalarSizeInBits()) {
2888 SDVTList Tys =
2889 LN->isIndexed()
2890 ? DAG.getVTList(VT, LN->getBasePtr().getValueType(), MVT::Other)
2891 : DAG.getVTList(VT, MVT::Other);
2892 SDValue Ops[] = {LN->getChain(), LN->getBasePtr(), LN->getOffset()};
2893 SDValue BCast = DAG.getNode(LoongArchISD::VLDREPL, DL, Tys, Ops);
2894 DAG.ReplaceAllUsesOfValueWith(SDValue(LN, 1), BCast.getValue(1));
2895 return BCast;
2896 }
2897 return SDValue();
2898}
2899
2900// Sequentially insert elements from Ops into Vector, from low to high indices.
2901// Note: Ops can have fewer elements than Vector.
2902static void fillVector(ArrayRef<SDValue> Ops, SelectionDAG &DAG, SDLoc DL,
2903 const LoongArchSubtarget &Subtarget, SDValue &Vector,
2904 EVT ResTy) {
2905 assert(Ops.size() <= ResTy.getVectorNumElements());
2906
2907 SDValue Op0 = Ops[0];
2908 if (!Op0.isUndef())
2909 Vector = DAG.getNode(ISD::SCALAR_TO_VECTOR, DL, ResTy, Op0);
2910 for (unsigned i = 1; i < Ops.size(); ++i) {
2911 SDValue Opi = Ops[i];
2912 if (Opi.isUndef())
2913 continue;
2914 Vector = DAG.getNode(ISD::INSERT_VECTOR_ELT, DL, ResTy, Vector, Opi,
2915 DAG.getConstant(i, DL, Subtarget.getGRLenVT()));
2916 }
2917}
2918
2919// Build a ResTy subvector from Node, taking NumElts elements starting at index
2920// 'first'.
2921static SDValue fillSubVectorFromBuildVector(BuildVectorSDNode *Node,
2922 SelectionDAG &DAG, SDLoc DL,
2923 const LoongArchSubtarget &Subtarget,
2924 EVT ResTy, unsigned first) {
2925 unsigned NumElts = ResTy.getVectorNumElements();
2926
2927 assert(first + NumElts <= Node->getSimpleValueType(0).getVectorNumElements());
2928
2929 SmallVector<SDValue, 16> Ops(Node->op_begin() + first,
2930 Node->op_begin() + first + NumElts);
2931 SDValue Vector = DAG.getUNDEF(ResTy);
2932 fillVector(Ops, DAG, DL, Subtarget, Vector, ResTy);
2933 return Vector;
2934}
2935
2936SDValue LoongArchTargetLowering::lowerBUILD_VECTOR(SDValue Op,
2937 SelectionDAG &DAG) const {
2938 BuildVectorSDNode *Node = cast<BuildVectorSDNode>(Op);
2939 MVT VT = Node->getSimpleValueType(0);
2940 EVT ResTy = Op->getValueType(0);
2941 unsigned NumElts = ResTy.getVectorNumElements();
2942 SDLoc DL(Op);
2943 APInt SplatValue, SplatUndef;
2944 unsigned SplatBitSize;
2945 bool HasAnyUndefs;
2946 bool IsConstant = false;
2947 bool UseSameConstant = true;
2948 SDValue ConstantValue;
2949 bool Is128Vec = ResTy.is128BitVector();
2950 bool Is256Vec = ResTy.is256BitVector();
2951
2952 if ((!Subtarget.hasExtLSX() || !Is128Vec) &&
2953 (!Subtarget.hasExtLASX() || !Is256Vec))
2954 return SDValue();
2955
2956 if (SDValue Result = lowerBUILD_VECTORAsBroadCastLoad(Node, DL, DAG))
2957 return Result;
2958
2959 if (Node->isConstantSplat(SplatValue, SplatUndef, SplatBitSize, HasAnyUndefs,
2960 /*MinSplatBits=*/8) &&
2961 SplatBitSize <= 64) {
2962 // We can only cope with 8, 16, 32, or 64-bit elements.
2963 if (SplatBitSize != 8 && SplatBitSize != 16 && SplatBitSize != 32 &&
2964 SplatBitSize != 64)
2965 return SDValue();
2966
2967 if (SplatBitSize == 64 && !Subtarget.is64Bit()) {
2968 // We can only handle 64-bit elements that are within
2969 // the signed 10-bit range or match vldi patterns on 32-bit targets.
2970 // See the BUILD_VECTOR case in LoongArchDAGToDAGISel::Select().
2971 if (!SplatValue.isSignedIntN(10) &&
2972 !isImmVLDILegalForMode1(SplatValue, SplatBitSize).first)
2973 return SDValue();
2974 if ((Is128Vec && ResTy == MVT::v4i32) ||
2975 (Is256Vec && ResTy == MVT::v8i32))
2976 return Op;
2977 }
2978
2979 EVT ViaVecTy;
2980
2981 switch (SplatBitSize) {
2982 default:
2983 return SDValue();
2984 case 8:
2985 ViaVecTy = Is128Vec ? MVT::v16i8 : MVT::v32i8;
2986 break;
2987 case 16:
2988 ViaVecTy = Is128Vec ? MVT::v8i16 : MVT::v16i16;
2989 break;
2990 case 32:
2991 ViaVecTy = Is128Vec ? MVT::v4i32 : MVT::v8i32;
2992 break;
2993 case 64:
2994 ViaVecTy = Is128Vec ? MVT::v2i64 : MVT::v4i64;
2995 break;
2996 }
2997
2998 // SelectionDAG::getConstant will promote SplatValue appropriately.
2999 SDValue Result = DAG.getConstant(SplatValue, DL, ViaVecTy);
3000
3001 // Bitcast to the type we originally wanted.
3002 if (ViaVecTy != ResTy)
3003 Result = DAG.getNode(ISD::BITCAST, SDLoc(Node), ResTy, Result);
3004
3005 return Result;
3006 }
3007
3008 if (DAG.isSplatValue(Op, /*AllowUndefs=*/false))
3009 return Op;
3010
3011 for (unsigned i = 0; i < NumElts; ++i) {
3012 SDValue Opi = Node->getOperand(i);
3013 if (isIntOrFPConstant(Opi)) {
3014 IsConstant = true;
3015 if (!ConstantValue.getNode())
3016 ConstantValue = Opi;
3017 else if (ConstantValue != Opi)
3018 UseSameConstant = false;
3019 }
3020 }
3021
3022 // If the type of BUILD_VECTOR is v2f64, custom legalizing it has no benefits.
3023 if (IsConstant && UseSameConstant && ResTy != MVT::v2f64) {
3024 SDValue Result = DAG.getSplatBuildVector(ResTy, DL, ConstantValue);
3025 for (unsigned i = 0; i < NumElts; ++i) {
3026 SDValue Opi = Node->getOperand(i);
3027 if (!isIntOrFPConstant(Opi))
3028 Result = DAG.getNode(ISD::INSERT_VECTOR_ELT, DL, ResTy, Result, Opi,
3029 DAG.getConstant(i, DL, Subtarget.getGRLenVT()));
3030 }
3031 return Result;
3032 }
3033
3034 if (!IsConstant) {
3035 // If the BUILD_VECTOR has a repeated pattern, use INSERT_VECTOR_ELT to fill
3036 // the sub-sequence of the vector and then broadcast the sub-sequence.
3037 //
3038 // TODO: If the BUILD_VECTOR contains undef elements, consider falling
3039 // back to use INSERT_VECTOR_ELT to materialize the vector, because it
3040 // generates worse code in some cases. This could be further optimized
3041 // with more consideration.
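// For instance, a v8i32 BUILD_VECTOR <a, b, a, b, a, b, a, b> has the
// repeated sequence {a, b}: the two elements are inserted into the low
// 128 bits, the vector is then viewed as v4i64 and its element 0 (packing
// a and b) is broadcast to all lanes with XVREPLVE0.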
3043 BitVector UndefElements;
3044 if (Node->getRepeatedSequence(Sequence, &UndefElements) &&
3045 UndefElements.count() == 0) {
3046 // Use LSX instructions to fill the sub-sequence of a 256-bit vector,
3047 // because the high part can simply be treated as undef.
3048 SDValue Vector = DAG.getUNDEF(ResTy);
3049 EVT FillTy = Is256Vec
3050 ? ResTy.getHalfNumVectorElementsVT(*DAG.getContext())
3051 : ResTy;
3052 SDValue FillVec =
3053 Is256Vec ? DAG.getExtractSubvector(DL, FillTy, Vector, 0) : Vector;
3054
3055 fillVector(Sequence, DAG, DL, Subtarget, FillVec, FillTy);
3056
3057 unsigned SeqLen = Sequence.size();
3058 unsigned SplatLen = NumElts / SeqLen;
3059 MVT SplatEltTy = MVT::getIntegerVT(VT.getScalarSizeInBits() * SeqLen);
3060 MVT SplatTy = MVT::getVectorVT(SplatEltTy, SplatLen);
3061
3062 // If the size of the sub-sequence is half of a 256-bit vector, bitcast the
3063 // vector to v4i64 in order to match the pattern of XVREPLVE0Q.
3064 if (SplatEltTy == MVT::i128)
3065 SplatTy = MVT::v4i64;
3066
3067 SDValue SplatVec;
3068 SDValue SrcVec = DAG.getBitcast(
3069 SplatTy,
3070 Is256Vec ? DAG.getInsertSubvector(DL, Vector, FillVec, 0) : FillVec);
3071 if (Is256Vec) {
3072 SplatVec =
3073 DAG.getNode((SplatEltTy == MVT::i128) ? LoongArchISD::XVREPLVE0Q
3074 : LoongArchISD::XVREPLVE0,
3075 DL, SplatTy, SrcVec);
3076 } else {
3077 SplatVec = DAG.getNode(LoongArchISD::VREPLVEI, DL, SplatTy, SrcVec,
3078 DAG.getConstant(0, DL, Subtarget.getGRLenVT()));
3079 }
3080
3081 return DAG.getBitcast(ResTy, SplatVec);
3082 }
3083
3084 // Use INSERT_VECTOR_ELT operations rather than expand to stores, because
3085 // using memory operations is much slower.
3086 //
3087 // For 256-bit vectors, normally split into two halves and concatenate.
3088 // Special case: for v8i32/v8f32/v4i64/v4f64, if the upper half has only
3089 // one non-undef element, skip splitting to avoid a worse result.
3090 if (ResTy == MVT::v8i32 || ResTy == MVT::v8f32 || ResTy == MVT::v4i64 ||
3091 ResTy == MVT::v4f64) {
3092 unsigned NonUndefCount = 0;
3093 for (unsigned i = NumElts / 2; i < NumElts; ++i) {
3094 if (!Node->getOperand(i).isUndef()) {
3095 ++NonUndefCount;
3096 if (NonUndefCount > 1)
3097 break;
3098 }
3099 }
3100 if (NonUndefCount == 1)
3101 return fillSubVectorFromBuildVector(Node, DAG, DL, Subtarget, ResTy, 0);
3102 }
3103
3104 EVT VecTy =
3105 Is256Vec ? ResTy.getHalfNumVectorElementsVT(*DAG.getContext()) : ResTy;
3106 SDValue Vector =
3107 fillSubVectorFromBuildVector(Node, DAG, DL, Subtarget, VecTy, 0);
3108
3109 if (Is128Vec)
3110 return Vector;
3111
3112 SDValue VectorHi = fillSubVectorFromBuildVector(Node, DAG, DL, Subtarget,
3113 VecTy, NumElts / 2);
3114
3115 return DAG.getNode(ISD::CONCAT_VECTORS, DL, ResTy, Vector, VectorHi);
3116 }
3117
3118 return SDValue();
3119}
3120
3121SDValue LoongArchTargetLowering::lowerCONCAT_VECTORS(SDValue Op,
3122 SelectionDAG &DAG) const {
3123 SDLoc DL(Op);
3124 MVT ResVT = Op.getSimpleValueType();
3125 assert(ResVT.is256BitVector() && Op.getNumOperands() == 2);
3126
3127 unsigned NumOperands = Op.getNumOperands();
3128 unsigned NumFreezeUndef = 0;
3129 unsigned NumZero = 0;
3130 unsigned NumNonZero = 0;
3131 unsigned NonZeros = 0;
3132 SmallSet<SDValue, 4> Undefs;
3133 for (unsigned i = 0; i != NumOperands; ++i) {
3134 SDValue SubVec = Op.getOperand(i);
3135 if (SubVec.isUndef())
3136 continue;
3137 if (ISD::isFreezeUndef(SubVec.getNode())) {
3138 // If the freeze(undef) has multiple uses then we must fold to zero.
3139 if (SubVec.hasOneUse()) {
3140 ++NumFreezeUndef;
3141 } else {
3142 ++NumZero;
3143 Undefs.insert(SubVec);
3144 }
3145 } else if (ISD::isBuildVectorAllZeros(SubVec.getNode()))
3146 ++NumZero;
3147 else {
3148 assert(i < sizeof(NonZeros) * CHAR_BIT); // Ensure the shift is in range.
3149 NonZeros |= 1 << i;
3150 ++NumNonZero;
3151 }
3152 }
3153
3154 // If we have more than 2 non-zeros, build each half separately.
3155 if (NumNonZero > 2) {
3156 MVT HalfVT = ResVT.getHalfNumVectorElementsVT();
3157 ArrayRef<SDUse> Ops = Op->ops();
3158 SDValue Lo = DAG.getNode(ISD::CONCAT_VECTORS, DL, HalfVT,
3159 Ops.slice(0, NumOperands / 2));
3160 SDValue Hi = DAG.getNode(ISD::CONCAT_VECTORS, DL, HalfVT,
3161 Ops.slice(NumOperands / 2));
3162 return DAG.getNode(ISD::CONCAT_VECTORS, DL, ResVT, Lo, Hi);
3163 }
3164
3165 // Otherwise, build it up through insert_subvectors.
3166 SDValue Vec = NumZero ? DAG.getConstant(0, DL, ResVT)
3167 : (NumFreezeUndef ? DAG.getFreeze(DAG.getUNDEF(ResVT))
3168 : DAG.getUNDEF(ResVT));
3169
3170 // Replace Undef operands with ZeroVector.
3171 for (SDValue U : Undefs)
3172 DAG.ReplaceAllUsesWith(U, DAG.getConstant(0, DL, U.getSimpleValueType()));
3173
3174 MVT SubVT = Op.getOperand(0).getSimpleValueType();
3175 unsigned NumSubElems = SubVT.getVectorNumElements();
3176 for (unsigned i = 0; i != NumOperands; ++i) {
3177 if ((NonZeros & (1 << i)) == 0)
3178 continue;
3179
3180 Vec = DAG.getNode(ISD::INSERT_SUBVECTOR, DL, ResVT, Vec, Op.getOperand(i),
3181 DAG.getVectorIdxConstant(i * NumSubElems, DL));
3182 }
3183
3184 return Vec;
3185}
3186
3187SDValue
3188LoongArchTargetLowering::lowerEXTRACT_VECTOR_ELT(SDValue Op,
3189 SelectionDAG &DAG) const {
3190 MVT EltVT = Op.getSimpleValueType();
3191 SDValue Vec = Op->getOperand(0);
3192 EVT VecTy = Vec->getValueType(0);
3193 SDValue Idx = Op->getOperand(1);
3194 SDLoc DL(Op);
3195 MVT GRLenVT = Subtarget.getGRLenVT();
3196
3197 assert(VecTy.is256BitVector() && "Unexpected EXTRACT_VECTOR_ELT vector type");
3198
3199 if (isa<ConstantSDNode>(Idx))
3200 return Op;
3201
3202 switch (VecTy.getSimpleVT().SimpleTy) {
3203 default:
3204 llvm_unreachable("Unexpected type");
3205 case MVT::v32i8:
3206 case MVT::v16i16:
3207 case MVT::v4i64:
3208 case MVT::v4f64: {
3209 // Extract the high half subvector and place it in the low half of a new
3210 // vector. It doesn't matter what the high half of the new vector is.
3211 EVT HalfTy = VecTy.getHalfNumVectorElementsVT(*DAG.getContext());
3212 SDValue VecHi =
3213 DAG.getExtractSubvector(DL, HalfTy, Vec, HalfTy.getVectorNumElements());
3214 SDValue TmpVec =
3215 DAG.getNode(ISD::INSERT_SUBVECTOR, DL, VecTy, DAG.getUNDEF(VecTy),
3216 VecHi, DAG.getConstant(0, DL, GRLenVT));
3217
3218 // Shuffle the original Vec and TmpVec using MaskVec; the lowest element
3219 // of MaskVec is Idx and the rest do not matter. ResVec[0] will hold the
3220 // desired element.
3221 SDValue IdxCp =
3222 Subtarget.is64Bit()
3223 ? DAG.getNode(LoongArchISD::MOVGR2FR_W_LA64, DL, MVT::f32, Idx)
3224 : DAG.getBitcast(MVT::f32, Idx);
3225 SDValue IdxVec = DAG.getNode(ISD::SCALAR_TO_VECTOR, DL, MVT::v8f32, IdxCp);
3226 SDValue MaskVec =
3227 DAG.getBitcast((VecTy == MVT::v4f64) ? MVT::v4i64 : VecTy, IdxVec);
3228 SDValue ResVec =
3229 DAG.getNode(LoongArchISD::VSHUF, DL, VecTy, MaskVec, TmpVec, Vec);
3230
3231 return DAG.getNode(ISD::EXTRACT_VECTOR_ELT, DL, EltVT, ResVec,
3232 DAG.getConstant(0, DL, GRLenVT));
3233 }
3234 case MVT::v8i32:
3235 case MVT::v8f32: {
3236 SDValue SplatIdx = DAG.getSplatBuildVector(MVT::v8i32, DL, Idx);
3237 SDValue SplatValue =
3238 DAG.getNode(LoongArchISD::XVPERM, DL, VecTy, Vec, SplatIdx);
3239
3240 return DAG.getNode(ISD::EXTRACT_VECTOR_ELT, DL, EltVT, SplatValue,
3241 DAG.getConstant(0, DL, GRLenVT));
3242 }
3243 }
3244}
3245
3246SDValue
3247LoongArchTargetLowering::lowerINSERT_VECTOR_ELT(SDValue Op,
3248 SelectionDAG &DAG) const {
3249 MVT VT = Op.getSimpleValueType();
3250 MVT EltVT = VT.getVectorElementType();
3251 unsigned NumElts = VT.getVectorNumElements();
3252 unsigned EltSizeInBits = EltVT.getScalarSizeInBits();
3253 SDLoc DL(Op);
3254 SDValue Op0 = Op.getOperand(0);
3255 SDValue Op1 = Op.getOperand(1);
3256 SDValue Op2 = Op.getOperand(2);
3257
3258 if (isa<ConstantSDNode>(Op2))
3259 return Op;
3260
3261 MVT IdxTy = MVT::getIntegerVT(EltSizeInBits);
3262 MVT IdxVTy = MVT::getVectorVT(IdxTy, NumElts);
3263
3264 if (!isTypeLegal(VT) || !isTypeLegal(IdxVTy))
3265 return SDValue();
3266
3267 SDValue SplatElt = DAG.getSplatBuildVector(VT, DL, Op1);
3268 SmallVector<SDValue, 32> RawIndices;
3269 SDValue SplatIdx;
3270 SDValue Indices;
3271
3272 if (!Subtarget.is64Bit() && IdxTy == MVT::i64) {
3273 MVT PairVTy = MVT::getVectorVT(MVT::i32, NumElts * 2);
3274 for (unsigned i = 0; i < NumElts; ++i) {
3275 RawIndices.push_back(Op2);
3276 RawIndices.push_back(DAG.getConstant(0, DL, MVT::i32));
3277 }
3278 SplatIdx = DAG.getBuildVector(PairVTy, DL, RawIndices);
3279 SplatIdx = DAG.getBitcast(IdxVTy, SplatIdx);
3280
3281 RawIndices.clear();
3282 for (unsigned i = 0; i < NumElts; ++i) {
3283 RawIndices.push_back(DAG.getConstant(i, DL, MVT::i32));
3284 RawIndices.push_back(DAG.getConstant(0, DL, MVT::i32));
3285 }
3286 Indices = DAG.getBuildVector(PairVTy, DL, RawIndices);
3287 Indices = DAG.getBitcast(IdxVTy, Indices);
3288 } else {
3289 SplatIdx = DAG.getSplatBuildVector(IdxVTy, DL, Op2);
3290
3291 for (unsigned i = 0; i < NumElts; ++i)
3292 RawIndices.push_back(DAG.getConstant(i, DL, Subtarget.getGRLenVT()));
3293 Indices = DAG.getBuildVector(IdxVTy, DL, RawIndices);
3294 }
3295
3296 // insert vec, elt, idx
3297 // =>
3298 // select (splatidx == {0,1,2...}) ? splatelt : vec
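// For instance, for v4i32 with a run-time index: SplatIdx = <idx, idx, idx,
// idx> and Indices = <0, 1, 2, 3>; if idx is 2 at run time, the SETEQ mask is
// true only in lane 2, so the VSELECT takes the splatted element there and
// keeps the original vector elsewhere.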
3299 SDValue SelectCC =
3300 DAG.getSetCC(DL, IdxVTy, SplatIdx, Indices, ISD::CondCode::SETEQ);
3301 return DAG.getNode(ISD::VSELECT, DL, VT, SelectCC, SplatElt, Op0);
3302}
3303
3304SDValue LoongArchTargetLowering::lowerATOMIC_FENCE(SDValue Op,
3305 SelectionDAG &DAG) const {
3306 SDLoc DL(Op);
3307 SyncScope::ID FenceSSID =
3308 static_cast<SyncScope::ID>(Op.getConstantOperandVal(2));
3309
3310 // singlethread fences only synchronize with signal handlers on the same
3311 // thread and thus only need to preserve instruction order, not actually
3312 // enforce memory ordering.
3313 if (FenceSSID == SyncScope::SingleThread)
3314 // MEMBARRIER is a compiler barrier; it codegens to a no-op.
3315 return DAG.getNode(ISD::MEMBARRIER, DL, MVT::Other, Op.getOperand(0));
3316
3317 return Op;
3318}
3319
3320SDValue LoongArchTargetLowering::lowerWRITE_REGISTER(SDValue Op,
3321 SelectionDAG &DAG) const {
3322
3323 if (Subtarget.is64Bit() && Op.getOperand(2).getValueType() == MVT::i32) {
3324 DAG.getContext()->emitError(
3325 "On LA64, only 64-bit registers can be written.");
3326 return Op.getOperand(0);
3327 }
3328
3329 if (!Subtarget.is64Bit() && Op.getOperand(2).getValueType() == MVT::i64) {
3330 DAG.getContext()->emitError(
3331 "On LA32, only 32-bit registers can be written.");
3332 return Op.getOperand(0);
3333 }
3334
3335 return Op;
3336}
3337
3338SDValue LoongArchTargetLowering::lowerFRAMEADDR(SDValue Op,
3339 SelectionDAG &DAG) const {
3340 if (!isa<ConstantSDNode>(Op.getOperand(0))) {
3341 DAG.getContext()->emitError("argument to '__builtin_frame_address' must "
3342 "be a constant integer");
3343 return SDValue();
3344 }
3345
3346 MachineFunction &MF = DAG.getMachineFunction();
3347 MF.getFrameInfo().setFrameAddressIsTaken(true);
3348 Register FrameReg = Subtarget.getRegisterInfo()->getFrameRegister(MF);
3349 EVT VT = Op.getValueType();
3350 SDLoc DL(Op);
3351 SDValue FrameAddr = DAG.getCopyFromReg(DAG.getEntryNode(), DL, FrameReg, VT);
3352 unsigned Depth = Op.getConstantOperandVal(0);
3353 int GRLenInBytes = Subtarget.getGRLen() / 8;
3354
3355 while (Depth--) {
3356 int Offset = -(GRLenInBytes * 2);
3357 SDValue Ptr = DAG.getNode(ISD::ADD, DL, VT, FrameAddr,
3358 DAG.getSignedConstant(Offset, DL, VT));
3359 FrameAddr =
3360 DAG.getLoad(VT, DL, DAG.getEntryNode(), Ptr, MachinePointerInfo());
3361 }
3362 return FrameAddr;
3363}
3364
3365SDValue LoongArchTargetLowering::lowerRETURNADDR(SDValue Op,
3366 SelectionDAG &DAG) const {
3367 // Currently we only support lowering the return address for the current frame.
3368 if (Op.getConstantOperandVal(0) != 0) {
3369 DAG.getContext()->emitError(
3370 "return address can only be determined for the current frame");
3371 return SDValue();
3372 }
3373
3374 MachineFunction &MF = DAG.getMachineFunction();
3375 MF.getFrameInfo().setReturnAddressIsTaken(true);
3376 MVT GRLenVT = Subtarget.getGRLenVT();
3377
3378 // Return the value of the return address register, marking it an implicit
3379 // live-in.
3380 Register Reg = MF.addLiveIn(Subtarget.getRegisterInfo()->getRARegister(),
3381 getRegClassFor(GRLenVT));
3382 return DAG.getCopyFromReg(DAG.getEntryNode(), SDLoc(Op), Reg, GRLenVT);
3383}
3384
3385SDValue LoongArchTargetLowering::lowerEH_DWARF_CFA(SDValue Op,
3386 SelectionDAG &DAG) const {
3387 MachineFunction &MF = DAG.getMachineFunction();
3388 auto Size = Subtarget.getGRLen() / 8;
3389 auto FI = MF.getFrameInfo().CreateFixedObject(Size, 0, false);
3390 return DAG.getFrameIndex(FI, getPointerTy(DAG.getDataLayout()));
3391}
3392
3393SDValue LoongArchTargetLowering::lowerVASTART(SDValue Op,
3394 SelectionDAG &DAG) const {
3395 MachineFunction &MF = DAG.getMachineFunction();
3396 auto *FuncInfo = MF.getInfo<LoongArchMachineFunctionInfo>();
3397
3398 SDLoc DL(Op);
3399 SDValue FI = DAG.getFrameIndex(FuncInfo->getVarArgsFrameIndex(),
3400 getPointerTy(MF.getDataLayout()));
3401
3402 // vastart just stores the address of the VarArgsFrameIndex slot into the
3403 // memory location argument.
3404 const Value *SV = cast<SrcValueSDNode>(Op.getOperand(2))->getValue();
3405 return DAG.getStore(Op.getOperand(0), DL, FI, Op.getOperand(1),
3406 MachinePointerInfo(SV));
3407}
3408
3409SDValue LoongArchTargetLowering::lowerUINT_TO_FP(SDValue Op,
3410 SelectionDAG &DAG) const {
3411 assert(Subtarget.is64Bit() && Subtarget.hasBasicF() &&
3412 !Subtarget.hasBasicD() && "unexpected target features");
3413
3414 SDLoc DL(Op);
3415 SDValue Op0 = Op.getOperand(0);
3416 if (Op0->getOpcode() == ISD::AND) {
3417 auto *C = dyn_cast<ConstantSDNode>(Op0.getOperand(1));
3418 if (C && C->getZExtValue() < UINT64_C(0xFFFFFFFF))
3419 return Op;
3420 }
3421
3422 if (Op0->getOpcode() == LoongArchISD::BSTRPICK &&
3423 Op0.getConstantOperandVal(1) < UINT64_C(0X1F) &&
3424 Op0.getConstantOperandVal(2) == UINT64_C(0))
3425 return Op;
3426
3427 if (Op0.getOpcode() == ISD::AssertZext &&
3428 dyn_cast<VTSDNode>(Op0.getOperand(1))->getVT().bitsLT(MVT::i32))
3429 return Op;
3430
3431 EVT OpVT = Op0.getValueType();
3432 EVT RetVT = Op.getValueType();
3433 RTLIB::Libcall LC = RTLIB::getUINTTOFP(OpVT, RetVT);
3434 MakeLibCallOptions CallOptions;
3435 CallOptions.setTypeListBeforeSoften(OpVT, RetVT);
3436 SDValue Chain = SDValue();
3437 SDValue Result;
3438 std::tie(Result, Chain) =
3439 makeLibCall(DAG, LC, Op.getValueType(), Op0, CallOptions, DL, Chain);
3440 return Result;
3441}
3442
3443SDValue LoongArchTargetLowering::lowerSINT_TO_FP(SDValue Op,
3444 SelectionDAG &DAG) const {
3445 assert(Subtarget.is64Bit() && Subtarget.hasBasicF() &&
3446 !Subtarget.hasBasicD() && "unexpected target features");
3447
3448 SDLoc DL(Op);
3449 SDValue Op0 = Op.getOperand(0);
3450
3451 if ((Op0.getOpcode() == ISD::AssertSext ||
3452 Op0.getOpcode() == ISD::AssertZext) &&
3453 dyn_cast<VTSDNode>(Op0.getOperand(1))->getVT().bitsLE(MVT::i32))
3454 return Op;
3455
3456 EVT OpVT = Op0.getValueType();
3457 EVT RetVT = Op.getValueType();
3458 RTLIB::Libcall LC = RTLIB::getSINTTOFP(OpVT, RetVT);
3459 MakeLibCallOptions CallOptions;
3460 CallOptions.setTypeListBeforeSoften(OpVT, RetVT);
3461 SDValue Chain = SDValue();
3462 SDValue Result;
3463 std::tie(Result, Chain) =
3464 makeLibCall(DAG, LC, Op.getValueType(), Op0, CallOptions, DL, Chain);
3465 return Result;
3466}
3467
3468SDValue LoongArchTargetLowering::lowerBITCAST(SDValue Op,
3469 SelectionDAG &DAG) const {
3470
3471 SDLoc DL(Op);
3472 EVT VT = Op.getValueType();
3473 SDValue Op0 = Op.getOperand(0);
3474 EVT Op0VT = Op0.getValueType();
3475
3476 if (Op.getValueType() == MVT::f32 && Op0VT == MVT::i32 &&
3477 Subtarget.is64Bit() && Subtarget.hasBasicF()) {
3478 SDValue NewOp0 = DAG.getNode(ISD::ANY_EXTEND, DL, MVT::i64, Op0);
3479 return DAG.getNode(LoongArchISD::MOVGR2FR_W_LA64, DL, MVT::f32, NewOp0);
3480 }
3481 if (VT == MVT::f64 && Op0VT == MVT::i64 && !Subtarget.is64Bit()) {
3482 SDValue Lo, Hi;
3483 std::tie(Lo, Hi) = DAG.SplitScalar(Op0, DL, MVT::i32, MVT::i32);
3484 return DAG.getNode(LoongArchISD::BUILD_PAIR_F64, DL, MVT::f64, Lo, Hi);
3485 }
3486 return Op;
3487}
3488
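// lowerFP_TO_SINT first extends an f16 source to f32. On LA64 with basic 'F'
// but without 'D', a result wider than 32 bits is produced by FTINT on f32
// followed by MOVFR2GR_S_LA64; otherwise the value is converted with FTINT in
// a same-sized FP type and bitcast to the integer result type.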
3489SDValue LoongArchTargetLowering::lowerFP_TO_SINT(SDValue Op,
3490 SelectionDAG &DAG) const {
3491
3492 SDLoc DL(Op);
3493 SDValue Op0 = Op.getOperand(0);
3494
3495 if (Op0.getValueType() == MVT::f16)
3496 Op0 = DAG.getNode(ISD::FP_EXTEND, DL, MVT::f32, Op0);
3497
3498 if (Op.getValueSizeInBits() > 32 && Subtarget.hasBasicF() &&
3499 !Subtarget.hasBasicD()) {
3500 SDValue Dst = DAG.getNode(LoongArchISD::FTINT, DL, MVT::f32, Op0);
3501 return DAG.getNode(LoongArchISD::MOVFR2GR_S_LA64, DL, MVT::i64, Dst);
3502 }
3503
3504 EVT FPTy = EVT::getFloatingPointVT(Op.getValueSizeInBits());
3505 SDValue Trunc = DAG.getNode(LoongArchISD::FTINT, DL, FPTy, Op0);
3506 return DAG.getNode(ISD::BITCAST, DL, Op.getValueType(), Trunc);
3507}
3508
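// The getTargetNode overloads below wrap the different address-carrying nodes
// (global address, block address, constant pool, jump table) into their
// target-specific forms; they are consumed by the getAddr() template further
// down.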
3509static SDValue getTargetNode(GlobalAddressSDNode *N, SDLoc DL, EVT Ty,
3510 SelectionDAG &DAG, unsigned Flags) {
3511 return DAG.getTargetGlobalAddress(N->getGlobal(), DL, Ty, 0, Flags);
3512}
3513
3514static SDValue getTargetNode(BlockAddressSDNode *N, SDLoc DL, EVT Ty,
3515 SelectionDAG &DAG, unsigned Flags) {
3516 return DAG.getTargetBlockAddress(N->getBlockAddress(), Ty, N->getOffset(),
3517 Flags);
3518}
3519
3520static SDValue getTargetNode(ConstantPoolSDNode *N, SDLoc DL, EVT Ty,
3521 SelectionDAG &DAG, unsigned Flags) {
3522 return DAG.getTargetConstantPool(N->getConstVal(), Ty, N->getAlign(),
3523 N->getOffset(), Flags);
3524}
3525
3526static SDValue getTargetNode(JumpTableSDNode *N, SDLoc DL, EVT Ty,
3527 SelectionDAG &DAG, unsigned Flags) {
3528 return DAG.getTargetJumpTable(N->getIndex(), Ty, Flags);
3529}
3530
3531template <class NodeTy>
3532SDValue LoongArchTargetLowering::getAddr(NodeTy *N, SelectionDAG &DAG,
3533 CodeModel::Model M,
3534 bool IsLocal) const {
3535 SDLoc DL(N);
3536 EVT Ty = getPointerTy(DAG.getDataLayout());
3537 SDValue Addr = getTargetNode(N, DL, Ty, DAG, 0);
3538 SDValue Load;
3539
3540 switch (M) {
3541 default:
3542 report_fatal_error("Unsupported code model");
3543
3544 case CodeModel::Large: {
3545 assert(Subtarget.is64Bit() && "Large code model requires LA64");
3546
3547 // This is not actually used, but is necessary for successfully matching
3548 // the PseudoLA_*_LARGE nodes.
3549 SDValue Tmp = DAG.getConstant(0, DL, Ty);
3550 if (IsLocal) {
3551 // This generates the pattern (PseudoLA_PCREL_LARGE tmp sym), that
3552 // eventually becomes the desired 5-insn code sequence.
3553 Load = SDValue(DAG.getMachineNode(LoongArch::PseudoLA_PCREL_LARGE, DL, Ty,
3554 Tmp, Addr),
3555 0);
3556 } else {
3557 // This generates the pattern (PseudoLA_GOT_LARGE tmp sym), that
3558 // eventually becomes the desired 5-insn code sequence.
3559 Load = SDValue(
3560 DAG.getMachineNode(LoongArch::PseudoLA_GOT_LARGE, DL, Ty, Tmp, Addr),
3561 0);
3562 }
3563 break;
3564 }
3565
3566 case CodeModel::Small:
3567 case CodeModel::Medium:
3568 if (IsLocal) {
3569 // This generates the pattern (PseudoLA_PCREL sym), which expands to
3570 // (addi.w/d (pcalau12i %pc_hi20(sym)) %pc_lo12(sym)).
3571 Load = SDValue(
3572 DAG.getMachineNode(LoongArch::PseudoLA_PCREL, DL, Ty, Addr), 0);
3573 } else {
3574 // This generates the pattern (PseudoLA_GOT sym), which expands to (ld.w/d
3575 // (pcalau12i %got_pc_hi20(sym)) %got_pc_lo12(sym)).
3576 Load =
3577 SDValue(DAG.getMachineNode(LoongArch::PseudoLA_GOT, DL, Ty, Addr), 0);
3578 }
3579 }
3580
3581 if (!IsLocal) {
3582 // Mark the load instruction as invariant to enable hoisting in MachineLICM.
3583 MachineFunction &MF = DAG.getMachineFunction();
3584 MachineMemOperand *MemOp = MF.getMachineMemOperand(
3585 MachinePointerInfo::getGOT(MF),
3586 MachineMemOperand::MOLoad | MachineMemOperand::MODereferenceable |
3587 MachineMemOperand::MOInvariant,
3588 LLT(Ty.getSimpleVT()), Align(Ty.getFixedSizeInBits() / 8));
3589 DAG.setNodeMemRefs(cast<MachineSDNode>(Load.getNode()), {MemOp});
3590 }
3591
3592 return Load;
3593}
3594
3595SDValue LoongArchTargetLowering::lowerBlockAddress(SDValue Op,
3596 SelectionDAG &DAG) const {
3597 return getAddr(cast<BlockAddressSDNode>(Op), DAG,
3598 DAG.getTarget().getCodeModel());
3599}
3600
3601SDValue LoongArchTargetLowering::lowerJumpTable(SDValue Op,
3602 SelectionDAG &DAG) const {
3603 return getAddr(cast<JumpTableSDNode>(Op), DAG,
3604 DAG.getTarget().getCodeModel());
3605}
3606
3607SDValue LoongArchTargetLowering::lowerConstantPool(SDValue Op,
3608 SelectionDAG &DAG) const {
3609 return getAddr(cast<ConstantPoolSDNode>(Op), DAG,
3610 DAG.getTarget().getCodeModel());
3611}
3612
3613SDValue LoongArchTargetLowering::lowerGlobalAddress(SDValue Op,
3614 SelectionDAG &DAG) const {
3615 GlobalAddressSDNode *N = cast<GlobalAddressSDNode>(Op);
3616 assert(N->getOffset() == 0 && "unexpected offset in global node");
3617 auto CM = DAG.getTarget().getCodeModel();
3618 const GlobalValue *GV = N->getGlobal();
3619
3620 if (GV->isDSOLocal() && isa<GlobalVariable>(GV)) {
3621 if (auto GCM = dyn_cast<GlobalVariable>(GV)->getCodeModel())
3622 CM = *GCM;
3623 }
3624
3625 return getAddr(N, DAG, CM, GV->isDSOLocal());
3626}
3627
3628SDValue LoongArchTargetLowering::getStaticTLSAddr(GlobalAddressSDNode *N,
3629 SelectionDAG &DAG,
3630 unsigned Opc, bool UseGOT,
3631 bool Large) const {
3632 SDLoc DL(N);
3633 EVT Ty = getPointerTy(DAG.getDataLayout());
3634 MVT GRLenVT = Subtarget.getGRLenVT();
3635
3636 // This is not actually used, but is necessary for successfully matching the
3637 // PseudoLA_*_LARGE nodes.
3638 SDValue Tmp = DAG.getConstant(0, DL, Ty);
3639 SDValue Addr = DAG.getTargetGlobalAddress(N->getGlobal(), DL, Ty, 0, 0);
3640
3641 // Only IE needs an extra argument for large code model.
3642 SDValue Offset = Opc == LoongArch::PseudoLA_TLS_IE_LARGE
3643 ? SDValue(DAG.getMachineNode(Opc, DL, Ty, Tmp, Addr), 0)
3644 : SDValue(DAG.getMachineNode(Opc, DL, Ty, Addr), 0);
3645
3646 // If it is LE for normal/medium code model, the add tp operation will occur
3647 // during the pseudo-instruction expansion.
3648 if (Opc == LoongArch::PseudoLA_TLS_LE && !Large)
3649 return Offset;
3650
3651 if (UseGOT) {
3652 // Mark the load instruction as invariant to enable hoisting in MachineLICM.
3653 MachineFunction &MF = DAG.getMachineFunction();
3654 MachineMemOperand *MemOp = MF.getMachineMemOperand(
3655 MachinePointerInfo::getGOT(MF),
3656 MachineMemOperand::MOLoad | MachineMemOperand::MODereferenceable |
3657 MachineMemOperand::MOInvariant,
3658 LLT(Ty.getSimpleVT()), Align(Ty.getFixedSizeInBits() / 8));
3659 DAG.setNodeMemRefs(cast<MachineSDNode>(Offset.getNode()), {MemOp});
3660 }
3661
3662 // Add the thread pointer.
3663 return DAG.getNode(ISD::ADD, DL, Ty, Offset,
3664 DAG.getRegister(LoongArch::R2, GRLenVT));
3665}
3666
3667SDValue LoongArchTargetLowering::getDynamicTLSAddr(GlobalAddressSDNode *N,
3668 SelectionDAG &DAG,
3669 unsigned Opc,
3670 bool Large) const {
3671 SDLoc DL(N);
3672 EVT Ty = getPointerTy(DAG.getDataLayout());
3673 IntegerType *CallTy = Type::getIntNTy(*DAG.getContext(), Ty.getSizeInBits());
3674
3675 // This is not actually used, but is necessary for successfully matching the
3676 // PseudoLA_*_LARGE nodes.
3677 SDValue Tmp = DAG.getConstant(0, DL, Ty);
3678
3679 // Use a PC-relative addressing mode to access the dynamic GOT address.
3680 SDValue Addr = DAG.getTargetGlobalAddress(N->getGlobal(), DL, Ty, 0, 0);
3681 SDValue Load = Large ? SDValue(DAG.getMachineNode(Opc, DL, Ty, Tmp, Addr), 0)
3682 : SDValue(DAG.getMachineNode(Opc, DL, Ty, Addr), 0);
3683
3684 // Prepare argument list to generate call.
3685 TargetLowering::ArgListTy Args;
3686 Args.emplace_back(Load, CallTy);
3687
3688 // Setup call to __tls_get_addr.
3689 TargetLowering::CallLoweringInfo CLI(DAG);
3690 CLI.setDebugLoc(DL)
3691 .setChain(DAG.getEntryNode())
3692 .setLibCallee(CallingConv::C, CallTy,
3693 DAG.getExternalSymbol("__tls_get_addr", Ty),
3694 std::move(Args));
3695
3696 return LowerCallTo(CLI).first;
3697}
3698
3699SDValue LoongArchTargetLowering::getTLSDescAddr(GlobalAddressSDNode *N,
3700 SelectionDAG &DAG, unsigned Opc,
3701 bool Large) const {
3702 SDLoc DL(N);
3703 EVT Ty = getPointerTy(DAG.getDataLayout());
3704 const GlobalValue *GV = N->getGlobal();
3705
3706 // This is not actually used, but is necessary for successfully matching the
3707 // PseudoLA_*_LARGE nodes.
3708 SDValue Tmp = DAG.getConstant(0, DL, Ty);
3709
3710 // Use a PC-relative addressing mode to access the global dynamic GOT address.
3711 // This generates the pattern (PseudoLA_TLS_DESC_PC{,LARGE} sym).
3712 SDValue Addr = DAG.getTargetGlobalAddress(GV, DL, Ty, 0, 0);
3713 return Large ? SDValue(DAG.getMachineNode(Opc, DL, Ty, Tmp, Addr), 0)
3714 : SDValue(DAG.getMachineNode(Opc, DL, Ty, Addr), 0);
3715}
3716
3717SDValue
3718LoongArchTargetLowering::lowerGlobalTLSAddress(SDValue Op,
3719 SelectionDAG &DAG) const {
3720 if (DAG.getMachineFunction().getFunction().getCallingConv() ==
3721 CallingConv::GHC)
3722 report_fatal_error("In GHC calling convention TLS is not supported");
3723
3724 bool Large = DAG.getTarget().getCodeModel() == CodeModel::Large;
3725 assert((!Large || Subtarget.is64Bit()) && "Large code model requires LA64");
3726
3727 GlobalAddressSDNode *N = cast<GlobalAddressSDNode>(Op);
3728 assert(N->getOffset() == 0 && "unexpected offset in global node");
3729
3730 if (DAG.getTarget().useEmulatedTLS())
3731 reportFatalUsageError("the emulated TLS is prohibited");
3732
3733 bool IsDesc = DAG.getTarget().useTLSDESC();
3734
3735 switch (getTargetMachine().getTLSModel(N->getGlobal())) {
3736 case TLSModel::GeneralDynamic:
3737 // In this model, application code calls the dynamic linker function
3738 // __tls_get_addr to locate TLS offsets into the dynamic thread vector at
3739 // runtime.
3740 if (!IsDesc)
3741 return getDynamicTLSAddr(N, DAG,
3742 Large ? LoongArch::PseudoLA_TLS_GD_LARGE
3743 : LoongArch::PseudoLA_TLS_GD,
3744 Large);
3745 break;
3746 case TLSModel::LocalDynamic:
3747 // Same as GeneralDynamic, except for assembly modifiers and relocation
3748 // records.
3749 if (!IsDesc)
3750 return getDynamicTLSAddr(N, DAG,
3751 Large ? LoongArch::PseudoLA_TLS_LD_LARGE
3752 : LoongArch::PseudoLA_TLS_LD,
3753 Large);
3754 break;
3755 case TLSModel::InitialExec:
3756 // This model uses the GOT to resolve TLS offsets.
3757 return getStaticTLSAddr(N, DAG,
3758 Large ? LoongArch::PseudoLA_TLS_IE_LARGE
3759 : LoongArch::PseudoLA_TLS_IE,
3760 /*UseGOT=*/true, Large);
3761 case TLSModel::LocalExec:
3762 // This model is used when static linking as the TLS offsets are resolved
3763 // during program linking.
3764 //
3765 // This node doesn't need an extra argument for the large code model.
3766 return getStaticTLSAddr(N, DAG, LoongArch::PseudoLA_TLS_LE,
3767 /*UseGOT=*/false, Large);
3768 }
3769
3770 return getTLSDescAddr(N, DAG,
3771 Large ? LoongArch::PseudoLA_TLS_DESC_LARGE
3772 : LoongArch::PseudoLA_TLS_DESC,
3773 Large);
3774}
3775
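// checkIntrinsicImmArg<N> verifies that operand ImmOp of the intrinsic is an
// immediate that fits in N bits (signed when IsSigned is set). On failure it
// emits a diagnostic and returns an UNDEF of the result type; on success it
// returns an empty SDValue so the caller falls back to the default lowering.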
3776template <unsigned N>
3777static SDValue checkIntrinsicImmArg(SDValue Op, unsigned ImmOp,
3778 SelectionDAG &DAG, bool IsSigned = false) {
3779 auto *CImm = cast<ConstantSDNode>(Op->getOperand(ImmOp));
3780 // Check the ImmArg.
3781 if ((IsSigned && !isInt<N>(CImm->getSExtValue())) ||
3782 (!IsSigned && !isUInt<N>(CImm->getZExtValue()))) {
3783 DAG.getContext()->emitError(Op->getOperationName(0) +
3784 ": argument out of range.");
3785 return DAG.getNode(ISD::UNDEF, SDLoc(Op), Op.getValueType());
3786 }
3787 return SDValue();
3788}
3789
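// Custom lowering of chain-less intrinsics: llvm.thread.pointer is mapped to
// the thread-pointer register $tp (R2); the LSX/LASX cases below only
// range-check their immediate operands via checkIntrinsicImmArg and otherwise
// leave instruction selection to the usual patterns.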
3790SDValue
3791LoongArchTargetLowering::lowerINTRINSIC_WO_CHAIN(SDValue Op,
3792 SelectionDAG &DAG) const {
3793 switch (Op.getConstantOperandVal(0)) {
3794 default:
3795 return SDValue(); // Don't custom lower most intrinsics.
3796 case Intrinsic::thread_pointer: {
3797 EVT PtrVT = getPointerTy(DAG.getDataLayout());
3798 return DAG.getRegister(LoongArch::R2, PtrVT);
3799 }
3800 case Intrinsic::loongarch_lsx_vpickve2gr_d:
3801 case Intrinsic::loongarch_lsx_vpickve2gr_du:
3802 case Intrinsic::loongarch_lsx_vreplvei_d:
3803 case Intrinsic::loongarch_lasx_xvrepl128vei_d:
3804 return checkIntrinsicImmArg<1>(Op, 2, DAG);
3805 case Intrinsic::loongarch_lsx_vreplvei_w:
3806 case Intrinsic::loongarch_lasx_xvrepl128vei_w:
3807 case Intrinsic::loongarch_lasx_xvpickve2gr_d:
3808 case Intrinsic::loongarch_lasx_xvpickve2gr_du:
3809 case Intrinsic::loongarch_lasx_xvpickve_d:
3810 case Intrinsic::loongarch_lasx_xvpickve_d_f:
3811 return checkIntrinsicImmArg<2>(Op, 2, DAG);
3812 case Intrinsic::loongarch_lasx_xvinsve0_d:
3813 return checkIntrinsicImmArg<2>(Op, 3, DAG);
3814 case Intrinsic::loongarch_lsx_vsat_b:
3815 case Intrinsic::loongarch_lsx_vsat_bu:
3816 case Intrinsic::loongarch_lsx_vrotri_b:
3817 case Intrinsic::loongarch_lsx_vsllwil_h_b:
3818 case Intrinsic::loongarch_lsx_vsllwil_hu_bu:
3819 case Intrinsic::loongarch_lsx_vsrlri_b:
3820 case Intrinsic::loongarch_lsx_vsrari_b:
3821 case Intrinsic::loongarch_lsx_vreplvei_h:
3822 case Intrinsic::loongarch_lasx_xvsat_b:
3823 case Intrinsic::loongarch_lasx_xvsat_bu:
3824 case Intrinsic::loongarch_lasx_xvrotri_b:
3825 case Intrinsic::loongarch_lasx_xvsllwil_h_b:
3826 case Intrinsic::loongarch_lasx_xvsllwil_hu_bu:
3827 case Intrinsic::loongarch_lasx_xvsrlri_b:
3828 case Intrinsic::loongarch_lasx_xvsrari_b:
3829 case Intrinsic::loongarch_lasx_xvrepl128vei_h:
3830 case Intrinsic::loongarch_lasx_xvpickve_w:
3831 case Intrinsic::loongarch_lasx_xvpickve_w_f:
3832 return checkIntrinsicImmArg<3>(Op, 2, DAG);
3833 case Intrinsic::loongarch_lasx_xvinsve0_w:
3834 return checkIntrinsicImmArg<3>(Op, 3, DAG);
3835 case Intrinsic::loongarch_lsx_vsat_h:
3836 case Intrinsic::loongarch_lsx_vsat_hu:
3837 case Intrinsic::loongarch_lsx_vrotri_h:
3838 case Intrinsic::loongarch_lsx_vsllwil_w_h:
3839 case Intrinsic::loongarch_lsx_vsllwil_wu_hu:
3840 case Intrinsic::loongarch_lsx_vsrlri_h:
3841 case Intrinsic::loongarch_lsx_vsrari_h:
3842 case Intrinsic::loongarch_lsx_vreplvei_b:
3843 case Intrinsic::loongarch_lasx_xvsat_h:
3844 case Intrinsic::loongarch_lasx_xvsat_hu:
3845 case Intrinsic::loongarch_lasx_xvrotri_h:
3846 case Intrinsic::loongarch_lasx_xvsllwil_w_h:
3847 case Intrinsic::loongarch_lasx_xvsllwil_wu_hu:
3848 case Intrinsic::loongarch_lasx_xvsrlri_h:
3849 case Intrinsic::loongarch_lasx_xvsrari_h:
3850 case Intrinsic::loongarch_lasx_xvrepl128vei_b:
3851 return checkIntrinsicImmArg<4>(Op, 2, DAG);
3852 case Intrinsic::loongarch_lsx_vsrlni_b_h:
3853 case Intrinsic::loongarch_lsx_vsrani_b_h:
3854 case Intrinsic::loongarch_lsx_vsrlrni_b_h:
3855 case Intrinsic::loongarch_lsx_vsrarni_b_h:
3856 case Intrinsic::loongarch_lsx_vssrlni_b_h:
3857 case Intrinsic::loongarch_lsx_vssrani_b_h:
3858 case Intrinsic::loongarch_lsx_vssrlni_bu_h:
3859 case Intrinsic::loongarch_lsx_vssrani_bu_h:
3860 case Intrinsic::loongarch_lsx_vssrlrni_b_h:
3861 case Intrinsic::loongarch_lsx_vssrarni_b_h:
3862 case Intrinsic::loongarch_lsx_vssrlrni_bu_h:
3863 case Intrinsic::loongarch_lsx_vssrarni_bu_h:
3864 case Intrinsic::loongarch_lasx_xvsrlni_b_h:
3865 case Intrinsic::loongarch_lasx_xvsrani_b_h:
3866 case Intrinsic::loongarch_lasx_xvsrlrni_b_h:
3867 case Intrinsic::loongarch_lasx_xvsrarni_b_h:
3868 case Intrinsic::loongarch_lasx_xvssrlni_b_h:
3869 case Intrinsic::loongarch_lasx_xvssrani_b_h:
3870 case Intrinsic::loongarch_lasx_xvssrlni_bu_h:
3871 case Intrinsic::loongarch_lasx_xvssrani_bu_h:
3872 case Intrinsic::loongarch_lasx_xvssrlrni_b_h:
3873 case Intrinsic::loongarch_lasx_xvssrarni_b_h:
3874 case Intrinsic::loongarch_lasx_xvssrlrni_bu_h:
3875 case Intrinsic::loongarch_lasx_xvssrarni_bu_h:
3876 return checkIntrinsicImmArg<4>(Op, 3, DAG);
3877 case Intrinsic::loongarch_lsx_vsat_w:
3878 case Intrinsic::loongarch_lsx_vsat_wu:
3879 case Intrinsic::loongarch_lsx_vrotri_w:
3880 case Intrinsic::loongarch_lsx_vsllwil_d_w:
3881 case Intrinsic::loongarch_lsx_vsllwil_du_wu:
3882 case Intrinsic::loongarch_lsx_vsrlri_w:
3883 case Intrinsic::loongarch_lsx_vsrari_w:
3884 case Intrinsic::loongarch_lsx_vslei_bu:
3885 case Intrinsic::loongarch_lsx_vslei_hu:
3886 case Intrinsic::loongarch_lsx_vslei_wu:
3887 case Intrinsic::loongarch_lsx_vslei_du:
3888 case Intrinsic::loongarch_lsx_vslti_bu:
3889 case Intrinsic::loongarch_lsx_vslti_hu:
3890 case Intrinsic::loongarch_lsx_vslti_wu:
3891 case Intrinsic::loongarch_lsx_vslti_du:
3892 case Intrinsic::loongarch_lsx_vbsll_v:
3893 case Intrinsic::loongarch_lsx_vbsrl_v:
3894 case Intrinsic::loongarch_lasx_xvsat_w:
3895 case Intrinsic::loongarch_lasx_xvsat_wu:
3896 case Intrinsic::loongarch_lasx_xvrotri_w:
3897 case Intrinsic::loongarch_lasx_xvsllwil_d_w:
3898 case Intrinsic::loongarch_lasx_xvsllwil_du_wu:
3899 case Intrinsic::loongarch_lasx_xvsrlri_w:
3900 case Intrinsic::loongarch_lasx_xvsrari_w:
3901 case Intrinsic::loongarch_lasx_xvslei_bu:
3902 case Intrinsic::loongarch_lasx_xvslei_hu:
3903 case Intrinsic::loongarch_lasx_xvslei_wu:
3904 case Intrinsic::loongarch_lasx_xvslei_du:
3905 case Intrinsic::loongarch_lasx_xvslti_bu:
3906 case Intrinsic::loongarch_lasx_xvslti_hu:
3907 case Intrinsic::loongarch_lasx_xvslti_wu:
3908 case Intrinsic::loongarch_lasx_xvslti_du:
3909 case Intrinsic::loongarch_lasx_xvbsll_v:
3910 case Intrinsic::loongarch_lasx_xvbsrl_v:
3911 return checkIntrinsicImmArg<5>(Op, 2, DAG);
3912 case Intrinsic::loongarch_lsx_vseqi_b:
3913 case Intrinsic::loongarch_lsx_vseqi_h:
3914 case Intrinsic::loongarch_lsx_vseqi_w:
3915 case Intrinsic::loongarch_lsx_vseqi_d:
3916 case Intrinsic::loongarch_lsx_vslei_b:
3917 case Intrinsic::loongarch_lsx_vslei_h:
3918 case Intrinsic::loongarch_lsx_vslei_w:
3919 case Intrinsic::loongarch_lsx_vslei_d:
3920 case Intrinsic::loongarch_lsx_vslti_b:
3921 case Intrinsic::loongarch_lsx_vslti_h:
3922 case Intrinsic::loongarch_lsx_vslti_w:
3923 case Intrinsic::loongarch_lsx_vslti_d:
3924 case Intrinsic::loongarch_lasx_xvseqi_b:
3925 case Intrinsic::loongarch_lasx_xvseqi_h:
3926 case Intrinsic::loongarch_lasx_xvseqi_w:
3927 case Intrinsic::loongarch_lasx_xvseqi_d:
3928 case Intrinsic::loongarch_lasx_xvslei_b:
3929 case Intrinsic::loongarch_lasx_xvslei_h:
3930 case Intrinsic::loongarch_lasx_xvslei_w:
3931 case Intrinsic::loongarch_lasx_xvslei_d:
3932 case Intrinsic::loongarch_lasx_xvslti_b:
3933 case Intrinsic::loongarch_lasx_xvslti_h:
3934 case Intrinsic::loongarch_lasx_xvslti_w:
3935 case Intrinsic::loongarch_lasx_xvslti_d:
3936 return checkIntrinsicImmArg<5>(Op, 2, DAG, /*IsSigned=*/true);
3937 case Intrinsic::loongarch_lsx_vsrlni_h_w:
3938 case Intrinsic::loongarch_lsx_vsrani_h_w:
3939 case Intrinsic::loongarch_lsx_vsrlrni_h_w:
3940 case Intrinsic::loongarch_lsx_vsrarni_h_w:
3941 case Intrinsic::loongarch_lsx_vssrlni_h_w:
3942 case Intrinsic::loongarch_lsx_vssrani_h_w:
3943 case Intrinsic::loongarch_lsx_vssrlni_hu_w:
3944 case Intrinsic::loongarch_lsx_vssrani_hu_w:
3945 case Intrinsic::loongarch_lsx_vssrlrni_h_w:
3946 case Intrinsic::loongarch_lsx_vssrarni_h_w:
3947 case Intrinsic::loongarch_lsx_vssrlrni_hu_w:
3948 case Intrinsic::loongarch_lsx_vssrarni_hu_w:
3949 case Intrinsic::loongarch_lsx_vfrstpi_b:
3950 case Intrinsic::loongarch_lsx_vfrstpi_h:
3951 case Intrinsic::loongarch_lasx_xvsrlni_h_w:
3952 case Intrinsic::loongarch_lasx_xvsrani_h_w:
3953 case Intrinsic::loongarch_lasx_xvsrlrni_h_w:
3954 case Intrinsic::loongarch_lasx_xvsrarni_h_w:
3955 case Intrinsic::loongarch_lasx_xvssrlni_h_w:
3956 case Intrinsic::loongarch_lasx_xvssrani_h_w:
3957 case Intrinsic::loongarch_lasx_xvssrlni_hu_w:
3958 case Intrinsic::loongarch_lasx_xvssrani_hu_w:
3959 case Intrinsic::loongarch_lasx_xvssrlrni_h_w:
3960 case Intrinsic::loongarch_lasx_xvssrarni_h_w:
3961 case Intrinsic::loongarch_lasx_xvssrlrni_hu_w:
3962 case Intrinsic::loongarch_lasx_xvssrarni_hu_w:
3963 case Intrinsic::loongarch_lasx_xvfrstpi_b:
3964 case Intrinsic::loongarch_lasx_xvfrstpi_h:
3965 return checkIntrinsicImmArg<5>(Op, 3, DAG);
3966 case Intrinsic::loongarch_lsx_vsat_d:
3967 case Intrinsic::loongarch_lsx_vsat_du:
3968 case Intrinsic::loongarch_lsx_vrotri_d:
3969 case Intrinsic::loongarch_lsx_vsrlri_d:
3970 case Intrinsic::loongarch_lsx_vsrari_d:
3971 case Intrinsic::loongarch_lasx_xvsat_d:
3972 case Intrinsic::loongarch_lasx_xvsat_du:
3973 case Intrinsic::loongarch_lasx_xvrotri_d:
3974 case Intrinsic::loongarch_lasx_xvsrlri_d:
3975 case Intrinsic::loongarch_lasx_xvsrari_d:
3976 return checkIntrinsicImmArg<6>(Op, 2, DAG);
3977 case Intrinsic::loongarch_lsx_vsrlni_w_d:
3978 case Intrinsic::loongarch_lsx_vsrani_w_d:
3979 case Intrinsic::loongarch_lsx_vsrlrni_w_d:
3980 case Intrinsic::loongarch_lsx_vsrarni_w_d:
3981 case Intrinsic::loongarch_lsx_vssrlni_w_d:
3982 case Intrinsic::loongarch_lsx_vssrani_w_d:
3983 case Intrinsic::loongarch_lsx_vssrlni_wu_d:
3984 case Intrinsic::loongarch_lsx_vssrani_wu_d:
3985 case Intrinsic::loongarch_lsx_vssrlrni_w_d:
3986 case Intrinsic::loongarch_lsx_vssrarni_w_d:
3987 case Intrinsic::loongarch_lsx_vssrlrni_wu_d:
3988 case Intrinsic::loongarch_lsx_vssrarni_wu_d:
3989 case Intrinsic::loongarch_lasx_xvsrlni_w_d:
3990 case Intrinsic::loongarch_lasx_xvsrani_w_d:
3991 case Intrinsic::loongarch_lasx_xvsrlrni_w_d:
3992 case Intrinsic::loongarch_lasx_xvsrarni_w_d:
3993 case Intrinsic::loongarch_lasx_xvssrlni_w_d:
3994 case Intrinsic::loongarch_lasx_xvssrani_w_d:
3995 case Intrinsic::loongarch_lasx_xvssrlni_wu_d:
3996 case Intrinsic::loongarch_lasx_xvssrani_wu_d:
3997 case Intrinsic::loongarch_lasx_xvssrlrni_w_d:
3998 case Intrinsic::loongarch_lasx_xvssrarni_w_d:
3999 case Intrinsic::loongarch_lasx_xvssrlrni_wu_d:
4000 case Intrinsic::loongarch_lasx_xvssrarni_wu_d:
4001 return checkIntrinsicImmArg<6>(Op, 3, DAG);
4002 case Intrinsic::loongarch_lsx_vsrlni_d_q:
4003 case Intrinsic::loongarch_lsx_vsrani_d_q:
4004 case Intrinsic::loongarch_lsx_vsrlrni_d_q:
4005 case Intrinsic::loongarch_lsx_vsrarni_d_q:
4006 case Intrinsic::loongarch_lsx_vssrlni_d_q:
4007 case Intrinsic::loongarch_lsx_vssrani_d_q:
4008 case Intrinsic::loongarch_lsx_vssrlni_du_q:
4009 case Intrinsic::loongarch_lsx_vssrani_du_q:
4010 case Intrinsic::loongarch_lsx_vssrlrni_d_q:
4011 case Intrinsic::loongarch_lsx_vssrarni_d_q:
4012 case Intrinsic::loongarch_lsx_vssrlrni_du_q:
4013 case Intrinsic::loongarch_lsx_vssrarni_du_q:
4014 case Intrinsic::loongarch_lasx_xvsrlni_d_q:
4015 case Intrinsic::loongarch_lasx_xvsrani_d_q:
4016 case Intrinsic::loongarch_lasx_xvsrlrni_d_q:
4017 case Intrinsic::loongarch_lasx_xvsrarni_d_q:
4018 case Intrinsic::loongarch_lasx_xvssrlni_d_q:
4019 case Intrinsic::loongarch_lasx_xvssrani_d_q:
4020 case Intrinsic::loongarch_lasx_xvssrlni_du_q:
4021 case Intrinsic::loongarch_lasx_xvssrani_du_q:
4022 case Intrinsic::loongarch_lasx_xvssrlrni_d_q:
4023 case Intrinsic::loongarch_lasx_xvssrarni_d_q:
4024 case Intrinsic::loongarch_lasx_xvssrlrni_du_q:
4025 case Intrinsic::loongarch_lasx_xvssrarni_du_q:
4026 return checkIntrinsicImmArg<7>(Op, 3, DAG);
4027 case Intrinsic::loongarch_lsx_vnori_b:
4028 case Intrinsic::loongarch_lsx_vshuf4i_b:
4029 case Intrinsic::loongarch_lsx_vshuf4i_h:
4030 case Intrinsic::loongarch_lsx_vshuf4i_w:
4031 case Intrinsic::loongarch_lasx_xvnori_b:
4032 case Intrinsic::loongarch_lasx_xvshuf4i_b:
4033 case Intrinsic::loongarch_lasx_xvshuf4i_h:
4034 case Intrinsic::loongarch_lasx_xvshuf4i_w:
4035 case Intrinsic::loongarch_lasx_xvpermi_d:
4036 return checkIntrinsicImmArg<8>(Op, 2, DAG);
4037 case Intrinsic::loongarch_lsx_vshuf4i_d:
4038 case Intrinsic::loongarch_lsx_vpermi_w:
4039 case Intrinsic::loongarch_lsx_vbitseli_b:
4040 case Intrinsic::loongarch_lsx_vextrins_b:
4041 case Intrinsic::loongarch_lsx_vextrins_h:
4042 case Intrinsic::loongarch_lsx_vextrins_w:
4043 case Intrinsic::loongarch_lsx_vextrins_d:
4044 case Intrinsic::loongarch_lasx_xvshuf4i_d:
4045 case Intrinsic::loongarch_lasx_xvpermi_w:
4046 case Intrinsic::loongarch_lasx_xvpermi_q:
4047 case Intrinsic::loongarch_lasx_xvbitseli_b:
4048 case Intrinsic::loongarch_lasx_xvextrins_b:
4049 case Intrinsic::loongarch_lasx_xvextrins_h:
4050 case Intrinsic::loongarch_lasx_xvextrins_w:
4051 case Intrinsic::loongarch_lasx_xvextrins_d:
4052 return checkIntrinsicImmArg<8>(Op, 3, DAG);
4053 case Intrinsic::loongarch_lsx_vrepli_b:
4054 case Intrinsic::loongarch_lsx_vrepli_h:
4055 case Intrinsic::loongarch_lsx_vrepli_w:
4056 case Intrinsic::loongarch_lsx_vrepli_d:
4057 case Intrinsic::loongarch_lasx_xvrepli_b:
4058 case Intrinsic::loongarch_lasx_xvrepli_h:
4059 case Intrinsic::loongarch_lasx_xvrepli_w:
4060 case Intrinsic::loongarch_lasx_xvrepli_d:
4061 return checkIntrinsicImmArg<10>(Op, 1, DAG, /*IsSigned=*/true);
4062 case Intrinsic::loongarch_lsx_vldi:
4063 case Intrinsic::loongarch_lasx_xvldi:
4064 return checkIntrinsicImmArg<13>(Op, 1, DAG, /*IsSigned=*/true);
4065 }
4066}
4067
4068// Helper function that emits an error message for intrinsics with a chain and
4069// returns the merge values of an UNDEF and the chain.
4070static SDValue emitIntrinsicWithChainErrorMessage(SDValue Op,
4071 StringRef ErrorMsg,
4072 SelectionDAG &DAG) {
4073 DAG.getContext()->emitError(Op->getOperationName(0) + ": " + ErrorMsg + ".");
4074 return DAG.getMergeValues({DAG.getUNDEF(Op.getValueType()), Op.getOperand(0)},
4075 SDLoc(Op));
4076}
4077
4078SDValue
4079LoongArchTargetLowering::lowerINTRINSIC_W_CHAIN(SDValue Op,
4080 SelectionDAG &DAG) const {
4081 SDLoc DL(Op);
4082 MVT GRLenVT = Subtarget.getGRLenVT();
4083 EVT VT = Op.getValueType();
4084 SDValue Chain = Op.getOperand(0);
4085 const StringRef ErrorMsgOOR = "argument out of range";
4086 const StringRef ErrorMsgReqLA64 = "requires loongarch64";
4087 const StringRef ErrorMsgReqF = "requires basic 'f' target feature";
4088
4089 switch (Op.getConstantOperandVal(1)) {
4090 default:
4091 return Op;
4092 case Intrinsic::loongarch_crc_w_b_w:
4093 case Intrinsic::loongarch_crc_w_h_w:
4094 case Intrinsic::loongarch_crc_w_w_w:
4095 case Intrinsic::loongarch_crc_w_d_w:
4096 case Intrinsic::loongarch_crcc_w_b_w:
4097 case Intrinsic::loongarch_crcc_w_h_w:
4098 case Intrinsic::loongarch_crcc_w_w_w:
4099 case Intrinsic::loongarch_crcc_w_d_w:
4100 return emitIntrinsicWithChainErrorMessage(Op, ErrorMsgReqLA64, DAG);
4101 case Intrinsic::loongarch_csrrd_w:
4102 case Intrinsic::loongarch_csrrd_d: {
4103 unsigned Imm = Op.getConstantOperandVal(2);
4104 return !isUInt<14>(Imm)
4105 ? emitIntrinsicWithChainErrorMessage(Op, ErrorMsgOOR, DAG)
4106 : DAG.getNode(LoongArchISD::CSRRD, DL, {GRLenVT, MVT::Other},
4107 {Chain, DAG.getConstant(Imm, DL, GRLenVT)});
4108 }
4109 case Intrinsic::loongarch_csrwr_w:
4110 case Intrinsic::loongarch_csrwr_d: {
4111 unsigned Imm = Op.getConstantOperandVal(3);
4112 return !isUInt<14>(Imm)
4113 ? emitIntrinsicWithChainErrorMessage(Op, ErrorMsgOOR, DAG)
4114 : DAG.getNode(LoongArchISD::CSRWR, DL, {GRLenVT, MVT::Other},
4115 {Chain, Op.getOperand(2),
4116 DAG.getConstant(Imm, DL, GRLenVT)});
4117 }
4118 case Intrinsic::loongarch_csrxchg_w:
4119 case Intrinsic::loongarch_csrxchg_d: {
4120 unsigned Imm = Op.getConstantOperandVal(4);
4121 return !isUInt<14>(Imm)
4122 ? emitIntrinsicWithChainErrorMessage(Op, ErrorMsgOOR, DAG)
4123 : DAG.getNode(LoongArchISD::CSRXCHG, DL, {GRLenVT, MVT::Other},
4124 {Chain, Op.getOperand(2), Op.getOperand(3),
4125 DAG.getConstant(Imm, DL, GRLenVT)});
4126 }
4127 case Intrinsic::loongarch_iocsrrd_d: {
4128 return DAG.getNode(
4129 LoongArchISD::IOCSRRD_D, DL, {GRLenVT, MVT::Other},
4130 {Chain, DAG.getNode(ISD::ANY_EXTEND, DL, MVT::i64, Op.getOperand(2))});
4131 }
4132#define IOCSRRD_CASE(NAME, NODE) \
4133 case Intrinsic::loongarch_##NAME: { \
4134 return DAG.getNode(LoongArchISD::NODE, DL, {GRLenVT, MVT::Other}, \
4135 {Chain, Op.getOperand(2)}); \
4136 }
4137 IOCSRRD_CASE(iocsrrd_b, IOCSRRD_B);
4138 IOCSRRD_CASE(iocsrrd_h, IOCSRRD_H);
4139 IOCSRRD_CASE(iocsrrd_w, IOCSRRD_W);
4140#undef IOCSRRD_CASE
4141 case Intrinsic::loongarch_cpucfg: {
4142 return DAG.getNode(LoongArchISD::CPUCFG, DL, {GRLenVT, MVT::Other},
4143 {Chain, Op.getOperand(2)});
4144 }
4145 case Intrinsic::loongarch_lddir_d: {
4146 unsigned Imm = Op.getConstantOperandVal(3);
4147 return !isUInt<8>(Imm)
4148 ? emitIntrinsicWithChainErrorMessage(Op, ErrorMsgOOR, DAG)
4149 : Op;
4150 }
4151 case Intrinsic::loongarch_movfcsr2gr: {
4152 if (!Subtarget.hasBasicF())
4153 return emitIntrinsicWithChainErrorMessage(Op, ErrorMsgReqF, DAG);
4154 unsigned Imm = Op.getConstantOperandVal(2);
4155 return !isUInt<2>(Imm)
4156 ? emitIntrinsicWithChainErrorMessage(Op, ErrorMsgOOR, DAG)
4157 : DAG.getNode(LoongArchISD::MOVFCSR2GR, DL, {VT, MVT::Other},
4158 {Chain, DAG.getConstant(Imm, DL, GRLenVT)});
4159 }
4160 case Intrinsic::loongarch_lsx_vld:
4161 case Intrinsic::loongarch_lsx_vldrepl_b:
4162 case Intrinsic::loongarch_lasx_xvld:
4163 case Intrinsic::loongarch_lasx_xvldrepl_b:
4164 return !isInt<12>(cast<ConstantSDNode>(Op.getOperand(3))->getSExtValue())
4165 ? emitIntrinsicWithChainErrorMessage(Op, ErrorMsgOOR, DAG)
4166 : SDValue();
4167 case Intrinsic::loongarch_lsx_vldrepl_h:
4168 case Intrinsic::loongarch_lasx_xvldrepl_h:
4169 return !isShiftedInt<11, 1>(
4170 cast<ConstantSDNode>(Op.getOperand(3))->getSExtValue())
4171 ? emitIntrinsicWithChainErrorMessage(
4172 Op, "argument out of range or not a multiple of 2", DAG)
4173 : SDValue();
4174 case Intrinsic::loongarch_lsx_vldrepl_w:
4175 case Intrinsic::loongarch_lasx_xvldrepl_w:
4176 return !isShiftedInt<10, 2>(
4177 cast<ConstantSDNode>(Op.getOperand(3))->getSExtValue())
4178 ? emitIntrinsicWithChainErrorMessage(
4179 Op, "argument out of range or not a multiple of 4", DAG)
4180 : SDValue();
4181 case Intrinsic::loongarch_lsx_vldrepl_d:
4182 case Intrinsic::loongarch_lasx_xvldrepl_d:
4183 return !isShiftedInt<9, 3>(
4184 cast<ConstantSDNode>(Op.getOperand(3))->getSExtValue())
4185 ? emitIntrinsicWithChainErrorMessage(
4186 Op, "argument out of range or not a multiple of 8", DAG)
4187 : SDValue();
4188 }
4189}
4190
4191// Helper function that emits an error message for intrinsics with a void
4192// return value and returns the chain.
4193static SDValue emitIntrinsicErrorMessage(SDValue Op, StringRef ErrorMsg,
4194 SelectionDAG &DAG) {
4195
4196 DAG.getContext()->emitError(Op->getOperationName(0) + ": " + ErrorMsg + ".");
4197 return Op.getOperand(0);
4198}
4199
4200SDValue LoongArchTargetLowering::lowerINTRINSIC_VOID(SDValue Op,
4201 SelectionDAG &DAG) const {
4202 SDLoc DL(Op);
4203 MVT GRLenVT = Subtarget.getGRLenVT();
4204 SDValue Chain = Op.getOperand(0);
4205 uint64_t IntrinsicEnum = Op.getConstantOperandVal(1);
4206 SDValue Op2 = Op.getOperand(2);
4207 const StringRef ErrorMsgOOR = "argument out of range";
4208 const StringRef ErrorMsgReqLA64 = "requires loongarch64";
4209 const StringRef ErrorMsgReqLA32 = "requires loongarch32";
4210 const StringRef ErrorMsgReqF = "requires basic 'f' target feature";
4211
4212 switch (IntrinsicEnum) {
4213 default:
4214 // TODO: Add more Intrinsics.
4215 return SDValue();
4216 case Intrinsic::loongarch_cacop_d:
4217 case Intrinsic::loongarch_cacop_w: {
4218 if (IntrinsicEnum == Intrinsic::loongarch_cacop_d && !Subtarget.is64Bit())
4219 return emitIntrinsicErrorMessage(Op, ErrorMsgReqLA64, DAG);
4220 if (IntrinsicEnum == Intrinsic::loongarch_cacop_w && Subtarget.is64Bit())
4221 return emitIntrinsicErrorMessage(Op, ErrorMsgReqLA32, DAG);
4222 // call void @llvm.loongarch.cacop.[d/w](uimm5, rj, simm12)
4223 unsigned Imm1 = Op2->getAsZExtVal();
4224 int Imm2 = cast<ConstantSDNode>(Op.getOperand(4))->getSExtValue();
4225 if (!isUInt<5>(Imm1) || !isInt<12>(Imm2))
4226 return emitIntrinsicErrorMessage(Op, ErrorMsgOOR, DAG);
4227 return Op;
4228 }
4229 case Intrinsic::loongarch_dbar: {
4230 unsigned Imm = Op2->getAsZExtVal();
4231 return !isUInt<15>(Imm)
4232 ? emitIntrinsicErrorMessage(Op, ErrorMsgOOR, DAG)
4233 : DAG.getNode(LoongArchISD::DBAR, DL, MVT::Other, Chain,
4234 DAG.getConstant(Imm, DL, GRLenVT));
4235 }
4236 case Intrinsic::loongarch_ibar: {
4237 unsigned Imm = Op2->getAsZExtVal();
4238 return !isUInt<15>(Imm)
4239 ? emitIntrinsicErrorMessage(Op, ErrorMsgOOR, DAG)
4240 : DAG.getNode(LoongArchISD::IBAR, DL, MVT::Other, Chain,
4241 DAG.getConstant(Imm, DL, GRLenVT));
4242 }
4243 case Intrinsic::loongarch_break: {
4244 unsigned Imm = Op2->getAsZExtVal();
4245 return !isUInt<15>(Imm)
4246 ? emitIntrinsicErrorMessage(Op, ErrorMsgOOR, DAG)
4247 : DAG.getNode(LoongArchISD::BREAK, DL, MVT::Other, Chain,
4248 DAG.getConstant(Imm, DL, GRLenVT));
4249 }
4250 case Intrinsic::loongarch_movgr2fcsr: {
4251 if (!Subtarget.hasBasicF())
4252 return emitIntrinsicErrorMessage(Op, ErrorMsgReqF, DAG);
4253 unsigned Imm = Op2->getAsZExtVal();
4254 return !isUInt<2>(Imm)
4255 ? emitIntrinsicErrorMessage(Op, ErrorMsgOOR, DAG)
4256 : DAG.getNode(LoongArchISD::MOVGR2FCSR, DL, MVT::Other, Chain,
4257 DAG.getConstant(Imm, DL, GRLenVT),
4258 DAG.getNode(ISD::ANY_EXTEND, DL, GRLenVT,
4259 Op.getOperand(3)));
4260 }
4261 case Intrinsic::loongarch_syscall: {
4262 unsigned Imm = Op2->getAsZExtVal();
4263 return !isUInt<15>(Imm)
4264 ? emitIntrinsicErrorMessage(Op, ErrorMsgOOR, DAG)
4265 : DAG.getNode(LoongArchISD::SYSCALL, DL, MVT::Other, Chain,
4266 DAG.getConstant(Imm, DL, GRLenVT));
4267 }
4268#define IOCSRWR_CASE(NAME, NODE) \
4269 case Intrinsic::loongarch_##NAME: { \
4270 SDValue Op3 = Op.getOperand(3); \
4271 return Subtarget.is64Bit() \
4272 ? DAG.getNode(LoongArchISD::NODE, DL, MVT::Other, Chain, \
4273 DAG.getNode(ISD::ANY_EXTEND, DL, MVT::i64, Op2), \
4274 DAG.getNode(ISD::ANY_EXTEND, DL, MVT::i64, Op3)) \
4275 : DAG.getNode(LoongArchISD::NODE, DL, MVT::Other, Chain, Op2, \
4276 Op3); \
4277 }
4278 IOCSRWR_CASE(iocsrwr_b, IOCSRWR_B);
4279 IOCSRWR_CASE(iocsrwr_h, IOCSRWR_H);
4280 IOCSRWR_CASE(iocsrwr_w, IOCSRWR_W);
4281#undef IOCSRWR_CASE
4282 case Intrinsic::loongarch_iocsrwr_d: {
4283 return !Subtarget.is64Bit()
4284 ? emitIntrinsicErrorMessage(Op, ErrorMsgReqLA64, DAG)
4285 : DAG.getNode(LoongArchISD::IOCSRWR_D, DL, MVT::Other, Chain,
4286 Op2,
4287 DAG.getNode(ISD::ANY_EXTEND, DL, MVT::i64,
4288 Op.getOperand(3)));
4289 }
4290#define ASRT_LE_GT_CASE(NAME) \
4291 case Intrinsic::loongarch_##NAME: { \
4292 return !Subtarget.is64Bit() \
4293 ? emitIntrinsicErrorMessage(Op, ErrorMsgReqLA64, DAG) \
4294 : Op; \
4295 }
4296 ASRT_LE_GT_CASE(asrtle_d)
4297 ASRT_LE_GT_CASE(asrtgt_d)
4298#undef ASRT_LE_GT_CASE
4299 case Intrinsic::loongarch_ldpte_d: {
4300 unsigned Imm = Op.getConstantOperandVal(3);
4301 return !Subtarget.is64Bit()
4302 ? emitIntrinsicErrorMessage(Op, ErrorMsgReqLA64, DAG)
4303 : !isUInt<8>(Imm) ? emitIntrinsicErrorMessage(Op, ErrorMsgOOR, DAG)
4304 : Op;
4305 }
4306 case Intrinsic::loongarch_lsx_vst:
4307 case Intrinsic::loongarch_lasx_xvst:
4308 return !isInt<12>(cast<ConstantSDNode>(Op.getOperand(4))->getSExtValue())
4309 ? emitIntrinsicErrorMessage(Op, ErrorMsgOOR, DAG)
4310 : SDValue();
4311 case Intrinsic::loongarch_lasx_xvstelm_b:
4312 return (!isInt<8>(cast<ConstantSDNode>(Op.getOperand(4))->getSExtValue()) ||
4313 !isUInt<5>(Op.getConstantOperandVal(5)))
4314 ? emitIntrinsicErrorMessage(Op, ErrorMsgOOR, DAG)
4315 : SDValue();
4316 case Intrinsic::loongarch_lsx_vstelm_b:
4317 return (!isInt<8>(cast<ConstantSDNode>(Op.getOperand(4))->getSExtValue()) ||
4318 !isUInt<4>(Op.getConstantOperandVal(5)))
4319 ? emitIntrinsicErrorMessage(Op, ErrorMsgOOR, DAG)
4320 : SDValue();
4321 case Intrinsic::loongarch_lasx_xvstelm_h:
4322 return (!isShiftedInt<8, 1>(
4323 cast<ConstantSDNode>(Op.getOperand(4))->getSExtValue()) ||
4324 !isUInt<4>(Op.getConstantOperandVal(5)))
4325 ? emitIntrinsicErrorMessage(
4326 Op, "argument out of range or not a multiple of 2", DAG)
4327 : SDValue();
4328 case Intrinsic::loongarch_lsx_vstelm_h:
4329 return (!isShiftedInt<8, 1>(
4330 cast<ConstantSDNode>(Op.getOperand(4))->getSExtValue()) ||
4331 !isUInt<3>(Op.getConstantOperandVal(5)))
4332 ? emitIntrinsicErrorMessage(
4333 Op, "argument out of range or not a multiple of 2", DAG)
4334 : SDValue();
4335 case Intrinsic::loongarch_lasx_xvstelm_w:
4336 return (!isShiftedInt<8, 2>(
4337 cast<ConstantSDNode>(Op.getOperand(4))->getSExtValue()) ||
4338 !isUInt<3>(Op.getConstantOperandVal(5)))
4339 ? emitIntrinsicErrorMessage(
4340 Op, "argument out of range or not a multiple of 4", DAG)
4341 : SDValue();
4342 case Intrinsic::loongarch_lsx_vstelm_w:
4343 return (!isShiftedInt<8, 2>(
4344 cast<ConstantSDNode>(Op.getOperand(4))->getSExtValue()) ||
4345 !isUInt<2>(Op.getConstantOperandVal(5)))
4346 ? emitIntrinsicErrorMessage(
4347 Op, "argument out of range or not a multiple of 4", DAG)
4348 : SDValue();
4349 case Intrinsic::loongarch_lasx_xvstelm_d:
4350 return (!isShiftedInt<8, 3>(
4351 cast<ConstantSDNode>(Op.getOperand(4))->getSExtValue()) ||
4352 !isUInt<2>(Op.getConstantOperandVal(5)))
4353 ? emitIntrinsicErrorMessage(
4354 Op, "argument out of range or not a multiple of 8", DAG)
4355 : SDValue();
4356 case Intrinsic::loongarch_lsx_vstelm_d:
4357 return (!isShiftedInt<8, 3>(
4358 cast<ConstantSDNode>(Op.getOperand(4))->getSExtValue()) ||
4359 !isUInt<1>(Op.getConstantOperandVal(5)))
4360 ? emitIntrinsicErrorMessage(
4361 Op, "argument out of range or not a multiple of 8", DAG)
4362 : SDValue();
4363 }
4364}
4365
4366SDValue LoongArchTargetLowering::lowerShiftLeftParts(SDValue Op,
4367 SelectionDAG &DAG) const {
4368 SDLoc DL(Op);
4369 SDValue Lo = Op.getOperand(0);
4370 SDValue Hi = Op.getOperand(1);
4371 SDValue Shamt = Op.getOperand(2);
4372 EVT VT = Lo.getValueType();
4373
4374 // if Shamt-GRLen < 0: // Shamt < GRLen
4375 // Lo = Lo << Shamt
4376 // Hi = (Hi << Shamt) | ((Lo >>u 1) >>u (GRLen-1 ^ Shamt))
4377 // else:
4378 // Lo = 0
4379 // Hi = Lo << (Shamt-GRLen)
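  //
  // For example, with GRLen = 32: a shift by Shamt = 5 takes the first branch,
  //   Lo = Lo << 5
  //   Hi = (Hi << 5) | ((Lo >>u 1) >>u (31 ^ 5)) = (Hi << 5) | (Lo >>u 27)
  // while a shift by Shamt = 40 takes the second branch, giving Lo = 0 and
  //   Hi = Lo << (40 - 32) = Lo << 8.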
4380
4381 SDValue Zero = DAG.getConstant(0, DL, VT);
4382 SDValue One = DAG.getConstant(1, DL, VT);
4383 SDValue MinusGRLen =
4384 DAG.getSignedConstant(-(int)Subtarget.getGRLen(), DL, VT);
4385 SDValue GRLenMinus1 = DAG.getConstant(Subtarget.getGRLen() - 1, DL, VT);
4386 SDValue ShamtMinusGRLen = DAG.getNode(ISD::ADD, DL, VT, Shamt, MinusGRLen);
4387 SDValue GRLenMinus1Shamt = DAG.getNode(ISD::XOR, DL, VT, Shamt, GRLenMinus1);
4388
4389 SDValue LoTrue = DAG.getNode(ISD::SHL, DL, VT, Lo, Shamt);
4390 SDValue ShiftRight1Lo = DAG.getNode(ISD::SRL, DL, VT, Lo, One);
4391 SDValue ShiftRightLo =
4392 DAG.getNode(ISD::SRL, DL, VT, ShiftRight1Lo, GRLenMinus1Shamt);
4393 SDValue ShiftLeftHi = DAG.getNode(ISD::SHL, DL, VT, Hi, Shamt);
4394 SDValue HiTrue = DAG.getNode(ISD::OR, DL, VT, ShiftLeftHi, ShiftRightLo);
4395 SDValue HiFalse = DAG.getNode(ISD::SHL, DL, VT, Lo, ShamtMinusGRLen);
4396
4397 SDValue CC = DAG.getSetCC(DL, VT, ShamtMinusGRLen, Zero, ISD::SETLT);
4398
4399 Lo = DAG.getNode(ISD::SELECT, DL, VT, CC, LoTrue, Zero);
4400 Hi = DAG.getNode(ISD::SELECT, DL, VT, CC, HiTrue, HiFalse);
4401
4402 SDValue Parts[2] = {Lo, Hi};
4403 return DAG.getMergeValues(Parts, DL);
4404}
4405
4406SDValue LoongArchTargetLowering::lowerShiftRightParts(SDValue Op,
4407 SelectionDAG &DAG,
4408 bool IsSRA) const {
4409 SDLoc DL(Op);
4410 SDValue Lo = Op.getOperand(0);
4411 SDValue Hi = Op.getOperand(1);
4412 SDValue Shamt = Op.getOperand(2);
4413 EVT VT = Lo.getValueType();
4414
4415 // SRA expansion:
4416 // if Shamt-GRLen < 0: // Shamt < GRLen
4417 // Lo = (Lo >>u Shamt) | ((Hi << 1) << (ShAmt ^ GRLen-1))
4418 // Hi = Hi >>s Shamt
4419 // else:
4420 // Lo = Hi >>s (Shamt-GRLen);
4421 // Hi = Hi >>s (GRLen-1)
4422 //
4423 // SRL expansion:
4424 // if Shamt-GRLen < 0: // Shamt < GRLen
4425 // Lo = (Lo >>u Shamt) | ((Hi << 1) << (ShAmt ^ GRLen-1))
4426 // Hi = Hi >>u Shamt
4427 // else:
4428 // Lo = Hi >>u (Shamt-GRLen);
4429 // Hi = 0;
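  //
  // For example, with GRLen = 32 and Shamt = 5 the SRL expansion computes
  //   Lo = (Lo >>u 5) | ((Hi << 1) << (5 ^ 31)) = (Lo >>u 5) | (Hi << 27)
  //   Hi = Hi >>u 5
  // and for Shamt = 40 it computes Lo = Hi >>u 8 and Hi = 0.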
4430
4431 unsigned ShiftRightOp = IsSRA ? ISD::SRA : ISD::SRL;
4432
4433 SDValue Zero = DAG.getConstant(0, DL, VT);
4434 SDValue One = DAG.getConstant(1, DL, VT);
4435 SDValue MinusGRLen =
4436 DAG.getSignedConstant(-(int)Subtarget.getGRLen(), DL, VT);
4437 SDValue GRLenMinus1 = DAG.getConstant(Subtarget.getGRLen() - 1, DL, VT);
4438 SDValue ShamtMinusGRLen = DAG.getNode(ISD::ADD, DL, VT, Shamt, MinusGRLen);
4439 SDValue GRLenMinus1Shamt = DAG.getNode(ISD::XOR, DL, VT, Shamt, GRLenMinus1);
4440
4441 SDValue ShiftRightLo = DAG.getNode(ISD::SRL, DL, VT, Lo, Shamt);
4442 SDValue ShiftLeftHi1 = DAG.getNode(ISD::SHL, DL, VT, Hi, One);
4443 SDValue ShiftLeftHi =
4444 DAG.getNode(ISD::SHL, DL, VT, ShiftLeftHi1, GRLenMinus1Shamt);
4445 SDValue LoTrue = DAG.getNode(ISD::OR, DL, VT, ShiftRightLo, ShiftLeftHi);
4446 SDValue HiTrue = DAG.getNode(ShiftRightOp, DL, VT, Hi, Shamt);
4447 SDValue LoFalse = DAG.getNode(ShiftRightOp, DL, VT, Hi, ShamtMinusGRLen);
4448 SDValue HiFalse =
4449 IsSRA ? DAG.getNode(ISD::SRA, DL, VT, Hi, GRLenMinus1) : Zero;
4450
4451 SDValue CC = DAG.getSetCC(DL, VT, ShamtMinusGRLen, Zero, ISD::SETLT);
4452
4453 Lo = DAG.getNode(ISD::SELECT, DL, VT, CC, LoTrue, LoFalse);
4454 Hi = DAG.getNode(ISD::SELECT, DL, VT, CC, HiTrue, HiFalse);
4455
4456 SDValue Parts[2] = {Lo, Hi};
4457 return DAG.getMergeValues(Parts, DL);
4458}
4459
4460// Returns the opcode of the target-specific SDNode that implements the 32-bit
4461// form of the given Opcode.
4462static LoongArchISD::NodeType getLoongArchWOpcode(unsigned Opcode) {
4463 switch (Opcode) {
4464 default:
4465 llvm_unreachable("Unexpected opcode");
4466 case ISD::SDIV:
4467 return LoongArchISD::DIV_W;
4468 case ISD::UDIV:
4469 return LoongArchISD::DIV_WU;
4470 case ISD::SREM:
4471 return LoongArchISD::MOD_W;
4472 case ISD::UREM:
4473 return LoongArchISD::MOD_WU;
4474 case ISD::SHL:
4475 return LoongArchISD::SLL_W;
4476 case ISD::SRA:
4477 return LoongArchISD::SRA_W;
4478 case ISD::SRL:
4479 return LoongArchISD::SRL_W;
4480 case ISD::ROTL:
4481 case ISD::ROTR:
4482 return LoongArchISD::ROTR_W;
4483 case ISD::CTTZ:
4484 return LoongArchISD::CTZ_W;
4485 case ISD::CTLZ:
4486 return LoongArchISD::CLZ_W;
4487 }
4488}
4489
4490// Converts the given i8/i16/i32 operation to a target-specific SelectionDAG
4491// node. Because i8/i16/i32 isn't a legal type for LA64, these operations would
4492// otherwise be promoted to i64, making it difficult to select the
4493// SLL_W/.../*W later on, because the fact that the operation was originally of
4494// type i8/i16/i32 is lost.
4495static SDValue customLegalizeToWOp(SDNode *N, SelectionDAG &DAG, int NumOp,
4496 unsigned ExtOpc = ISD::ANY_EXTEND) {
4497 SDLoc DL(N);
4498 LoongArchISD::NodeType WOpcode = getLoongArchWOpcode(N->getOpcode());
4499 SDValue NewOp0, NewRes;
4500
4501 switch (NumOp) {
4502 default:
4503 llvm_unreachable("Unexpected NumOp");
4504 case 1: {
4505 NewOp0 = DAG.getNode(ExtOpc, DL, MVT::i64, N->getOperand(0));
4506 NewRes = DAG.getNode(WOpcode, DL, MVT::i64, NewOp0);
4507 break;
4508 }
4509 case 2: {
4510 NewOp0 = DAG.getNode(ExtOpc, DL, MVT::i64, N->getOperand(0));
4511 SDValue NewOp1 = DAG.getNode(ExtOpc, DL, MVT::i64, N->getOperand(1));
4512 if (N->getOpcode() == ISD::ROTL) {
4513 SDValue TmpOp = DAG.getConstant(32, DL, MVT::i64);
4514 NewOp1 = DAG.getNode(ISD::SUB, DL, MVT::i64, TmpOp, NewOp1);
4515 }
4516 NewRes = DAG.getNode(WOpcode, DL, MVT::i64, NewOp0, NewOp1);
4517 break;
4518 }
4519 // TODO:Handle more NumOp.
4520 }
4521
4522 // ReplaceNodeResults requires we maintain the same type for the return
4523 // value.
4524 return DAG.getNode(ISD::TRUNCATE, DL, N->getValueType(0), NewRes);
4525}
4526
4527// Converts the given 32-bit operation to an i64 operation with signed-extension
4528// semantics, in order to reduce the number of sign-extension instructions.
4529static SDValue customLegalizeToWOpWithSExt(SDNode *N, SelectionDAG &DAG) {
4530 SDLoc DL(N);
4531 SDValue NewOp0 = DAG.getNode(ISD::ANY_EXTEND, DL, MVT::i64, N->getOperand(0));
4532 SDValue NewOp1 = DAG.getNode(ISD::ANY_EXTEND, DL, MVT::i64, N->getOperand(1));
4533 SDValue NewWOp = DAG.getNode(N->getOpcode(), DL, MVT::i64, NewOp0, NewOp1);
4534 SDValue NewRes = DAG.getNode(ISD::SIGN_EXTEND_INREG, DL, MVT::i64, NewWOp,
4535 DAG.getValueType(MVT::i32));
4536 return DAG.getNode(ISD::TRUNCATE, DL, MVT::i32, NewRes);
4537}
4538
4539// Helper function that emits an error message for intrinsics with or without a
4540// chain, and returns an UNDEF plus (when WithChain is set) the chain as the results.
4541static void emitErrorAndReplaceIntrinsicResults(
4542 SDNode *N, SmallVectorImpl<SDValue> &Results, SelectionDAG &DAG,
4543 StringRef ErrorMsg, bool WithChain = true) {
4544 DAG.getContext()->emitError(N->getOperationName(0) + ": " + ErrorMsg + ".");
4545 Results.push_back(DAG.getUNDEF(N->getValueType(0)));
4546 if (!WithChain)
4547 return;
4548 Results.push_back(N->getOperand(0));
4549}
4550
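// replaceVPICKVE2GRResults<N> legalizes an [x]vpickve2gr intrinsic result: it
// range-checks the lane index against N bits, builds the requested ResOp node
// (a VPICK_SEXT_ELT or VPICK_ZEXT_ELT for the callers below) on GRLenVT, and
// truncates the picked element back to the intrinsic's original result type.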
4551template <unsigned N>
4552static void
4553replaceVPICKVE2GRResults(SDNode *Node, SmallVectorImpl<SDValue> &Results,
4554 SelectionDAG &DAG, const LoongArchSubtarget &Subtarget,
4555 unsigned ResOp) {
4556 const StringRef ErrorMsgOOR = "argument out of range";
4557 unsigned Imm = Node->getConstantOperandVal(2);
4558 if (!isUInt<N>(Imm)) {
4559 emitErrorAndReplaceIntrinsicResults(Node, Results, DAG, ErrorMsgOOR,
4560 /*WithChain=*/false);
4561 return;
4562 }
4563 SDLoc DL(Node);
4564 SDValue Vec = Node->getOperand(1);
4565
4566 SDValue PickElt =
4567 DAG.getNode(ResOp, DL, Subtarget.getGRLenVT(), Vec,
4568 DAG.getConstant(Imm, DL, Subtarget.getGRLenVT()),
4569 DAG.getValueType(Vec.getValueType().getVectorElementType()));
4570 Results.push_back(DAG.getNode(ISD::TRUNCATE, DL, Node->getValueType(0),
4571 PickElt.getValue(0)));
4572}
4573
4574static void
4575replaceVecCondBranchResults(SDNode *N, SmallVectorImpl<SDValue> &Results,
4576 SelectionDAG &DAG,
4577 const LoongArchSubtarget &Subtarget,
4578 unsigned ResOp) {
4579 SDLoc DL(N);
4580 SDValue Vec = N->getOperand(1);
4581
4582 SDValue CB = DAG.getNode(ResOp, DL, Subtarget.getGRLenVT(), Vec);
4583 Results.push_back(
4584 DAG.getNode(ISD::TRUNCATE, DL, N->getValueType(0), CB.getValue(0)));
4585}
4586
4587static void
4588replaceINTRINSIC_WO_CHAINResults(SDNode *N, SmallVectorImpl<SDValue> &Results,
4589 SelectionDAG &DAG,
4590 const LoongArchSubtarget &Subtarget) {
4591 switch (N->getConstantOperandVal(0)) {
4592 default:
4593 llvm_unreachable("Unexpected Intrinsic.");
4594 case Intrinsic::loongarch_lsx_vpickve2gr_b:
4595 replaceVPICKVE2GRResults<4>(N, Results, DAG, Subtarget,
4596 LoongArchISD::VPICK_SEXT_ELT);
4597 break;
4598 case Intrinsic::loongarch_lsx_vpickve2gr_h:
4599 case Intrinsic::loongarch_lasx_xvpickve2gr_w:
4600 replaceVPICKVE2GRResults<3>(N, Results, DAG, Subtarget,
4601 LoongArchISD::VPICK_SEXT_ELT);
4602 break;
4603 case Intrinsic::loongarch_lsx_vpickve2gr_w:
4604 replaceVPICKVE2GRResults<2>(N, Results, DAG, Subtarget,
4605 LoongArchISD::VPICK_SEXT_ELT);
4606 break;
4607 case Intrinsic::loongarch_lsx_vpickve2gr_bu:
4608 replaceVPICKVE2GRResults<4>(N, Results, DAG, Subtarget,
4609 LoongArchISD::VPICK_ZEXT_ELT);
4610 break;
4611 case Intrinsic::loongarch_lsx_vpickve2gr_hu:
4612 case Intrinsic::loongarch_lasx_xvpickve2gr_wu:
4613 replaceVPICKVE2GRResults<3>(N, Results, DAG, Subtarget,
4614 LoongArchISD::VPICK_ZEXT_ELT);
4615 break;
4616 case Intrinsic::loongarch_lsx_vpickve2gr_wu:
4617 replaceVPICKVE2GRResults<2>(N, Results, DAG, Subtarget,
4618 LoongArchISD::VPICK_ZEXT_ELT);
4619 break;
4620 case Intrinsic::loongarch_lsx_bz_b:
4621 case Intrinsic::loongarch_lsx_bz_h:
4622 case Intrinsic::loongarch_lsx_bz_w:
4623 case Intrinsic::loongarch_lsx_bz_d:
4624 case Intrinsic::loongarch_lasx_xbz_b:
4625 case Intrinsic::loongarch_lasx_xbz_h:
4626 case Intrinsic::loongarch_lasx_xbz_w:
4627 case Intrinsic::loongarch_lasx_xbz_d:
4628 replaceVecCondBranchResults(N, Results, DAG, Subtarget,
4629 LoongArchISD::VALL_ZERO);
4630 break;
4631 case Intrinsic::loongarch_lsx_bz_v:
4632 case Intrinsic::loongarch_lasx_xbz_v:
4633 replaceVecCondBranchResults(N, Results, DAG, Subtarget,
4634 LoongArchISD::VANY_ZERO);
4635 break;
4636 case Intrinsic::loongarch_lsx_bnz_b:
4637 case Intrinsic::loongarch_lsx_bnz_h:
4638 case Intrinsic::loongarch_lsx_bnz_w:
4639 case Intrinsic::loongarch_lsx_bnz_d:
4640 case Intrinsic::loongarch_lasx_xbnz_b:
4641 case Intrinsic::loongarch_lasx_xbnz_h:
4642 case Intrinsic::loongarch_lasx_xbnz_w:
4643 case Intrinsic::loongarch_lasx_xbnz_d:
4644 replaceVecCondBranchResults(N, Results, DAG, Subtarget,
4645 LoongArchISD::VALL_NONZERO);
4646 break;
4647 case Intrinsic::loongarch_lsx_bnz_v:
4648 case Intrinsic::loongarch_lasx_xbnz_v:
4649 replaceVecCondBranchResults(N, Results, DAG, Subtarget,
4650 LoongArchISD::VANY_NONZERO);
4651 break;
4652 }
4653}
4654
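// replaceCMP_XCHG_128Results lowers an i128 ATOMIC_CMP_SWAP into a
// PseudoCmpXchg128[Acquire] machine node: the expected and new values are
// split into i64 halves, and the two result halves are reassembled with
// BUILD_PAIR alongside the output chain.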
4655static void replaceCMP_XCHG_128Results(SDNode *N,
4656 SmallVectorImpl<SDValue> &Results,
4657 SelectionDAG &DAG) {
4658 assert(N->getValueType(0) == MVT::i128 &&
4659 "AtomicCmpSwap on types less than 128 should be legal");
4660 MachineMemOperand *MemOp = cast<MemSDNode>(N)->getMemOperand();
4661
4662 unsigned Opcode;
4663 switch (MemOp->getMergedOrdering()) {
4664 case AtomicOrdering::Acquire:
4665 case AtomicOrdering::AcquireRelease:
4666 case AtomicOrdering::SequentiallyConsistent:
4667 Opcode = LoongArch::PseudoCmpXchg128Acquire;
4668 break;
4669 case AtomicOrdering::Monotonic:
4670 case AtomicOrdering::Release:
4671 Opcode = LoongArch::PseudoCmpXchg128;
4672 break;
4673 default:
4674 llvm_unreachable("Unexpected ordering!");
4675 }
4676
4677 SDLoc DL(N);
4678 auto CmpVal = DAG.SplitScalar(N->getOperand(2), DL, MVT::i64, MVT::i64);
4679 auto NewVal = DAG.SplitScalar(N->getOperand(3), DL, MVT::i64, MVT::i64);
4680 SDValue Ops[] = {N->getOperand(1), CmpVal.first, CmpVal.second,
4681 NewVal.first, NewVal.second, N->getOperand(0)};
4682
4683 SDNode *CmpSwap = DAG.getMachineNode(
4684 Opcode, SDLoc(N), DAG.getVTList(MVT::i64, MVT::i64, MVT::i64, MVT::Other),
4685 Ops);
4686 DAG.setNodeMemRefs(cast<MachineSDNode>(CmpSwap), {MemOp});
4687 Results.push_back(DAG.getNode(ISD::BUILD_PAIR, DL, MVT::i128,
4688 SDValue(CmpSwap, 0), SDValue(CmpSwap, 1)));
4689 Results.push_back(SDValue(CmpSwap, 3));
4690}
4691
4692void LoongArchTargetLowering::ReplaceNodeResults(
4693 SDNode *N, SmallVectorImpl<SDValue> &Results, SelectionDAG &DAG) const {
4694 SDLoc DL(N);
4695 EVT VT = N->getValueType(0);
4696 switch (N->getOpcode()) {
4697 default:
4698 llvm_unreachable("Don't know how to legalize this operation");
4699 case ISD::ADD:
4700 case ISD::SUB:
4701 assert(N->getValueType(0) == MVT::i32 && Subtarget.is64Bit() &&
4702 "Unexpected custom legalisation");
4703 Results.push_back(customLegalizeToWOpWithSExt(N, DAG));
4704 break;
4705 case ISD::SDIV:
4706 case ISD::UDIV:
4707 case ISD::SREM:
4708 case ISD::UREM:
4709 assert(VT == MVT::i32 && Subtarget.is64Bit() &&
4710 "Unexpected custom legalisation");
4711 Results.push_back(customLegalizeToWOp(N, DAG, 2,
4712 Subtarget.hasDiv32() && VT == MVT::i32
4713 ? ISD::ANY_EXTEND
4714 : ISD::SIGN_EXTEND));
4715 break;
4716 case ISD::SHL:
4717 case ISD::SRA:
4718 case ISD::SRL:
4719 assert(VT == MVT::i32 && Subtarget.is64Bit() &&
4720 "Unexpected custom legalisation");
4721 if (N->getOperand(1).getOpcode() != ISD::Constant) {
4722 Results.push_back(customLegalizeToWOp(N, DAG, 2));
4723 break;
4724 }
4725 break;
4726 case ISD::ROTL:
4727 case ISD::ROTR:
4728 assert(VT == MVT::i32 && Subtarget.is64Bit() &&
4729 "Unexpected custom legalisation");
4730 Results.push_back(customLegalizeToWOp(N, DAG, 2));
4731 break;
4732 case ISD::FP_TO_SINT: {
4733 assert(VT == MVT::i32 && Subtarget.is64Bit() &&
4734 "Unexpected custom legalisation");
4735 SDValue Src = N->getOperand(0);
4736 EVT FVT = EVT::getFloatingPointVT(N->getValueSizeInBits(0));
4737 if (getTypeAction(*DAG.getContext(), Src.getValueType()) !=
4738 TargetLowering::TypeSoftenFloat) {
4739 if (!isTypeLegal(Src.getValueType()))
4740 return;
4741 if (Src.getValueType() == MVT::f16)
4742 Src = DAG.getNode(ISD::FP_EXTEND, DL, MVT::f32, Src);
4743 SDValue Dst = DAG.getNode(LoongArchISD::FTINT, DL, FVT, Src);
4744 Results.push_back(DAG.getNode(ISD::BITCAST, DL, VT, Dst));
4745 return;
4746 }
4747 // If the FP type needs to be softened, emit a library call using the 'si'
4748 // version. If we left it to default legalization we'd end up with 'di'.
4749 RTLIB::Libcall LC;
4750 LC = RTLIB::getFPTOSINT(Src.getValueType(), VT);
4751 MakeLibCallOptions CallOptions;
4752 EVT OpVT = Src.getValueType();
4753 CallOptions.setTypeListBeforeSoften(OpVT, VT);
4754 SDValue Chain = SDValue();
4755 SDValue Result;
4756 std::tie(Result, Chain) =
4757 makeLibCall(DAG, LC, VT, Src, CallOptions, DL, Chain);
4758 Results.push_back(Result);
4759 break;
4760 }
4761 case ISD::BITCAST: {
4762 SDValue Src = N->getOperand(0);
4763 EVT SrcVT = Src.getValueType();
4764 if (VT == MVT::i32 && SrcVT == MVT::f32 && Subtarget.is64Bit() &&
4765 Subtarget.hasBasicF()) {
4766 SDValue Dst =
4767 DAG.getNode(LoongArchISD::MOVFR2GR_S_LA64, DL, MVT::i64, Src);
4768 Results.push_back(DAG.getNode(ISD::TRUNCATE, DL, MVT::i32, Dst));
4769 } else if (VT == MVT::i64 && SrcVT == MVT::f64 && !Subtarget.is64Bit()) {
4770 SDValue NewReg = DAG.getNode(LoongArchISD::SPLIT_PAIR_F64, DL,
4771 DAG.getVTList(MVT::i32, MVT::i32), Src);
4772 SDValue RetReg = DAG.getNode(ISD::BUILD_PAIR, DL, MVT::i64,
4773 NewReg.getValue(0), NewReg.getValue(1));
4774 Results.push_back(RetReg);
4775 }
4776 break;
4777 }
4778 case ISD::FP_TO_UINT: {
4779 assert(VT == MVT::i32 && Subtarget.is64Bit() &&
4780 "Unexpected custom legalisation");
4781 auto &TLI = DAG.getTargetLoweringInfo();
4782 SDValue Tmp1, Tmp2;
4783 TLI.expandFP_TO_UINT(N, Tmp1, Tmp2, DAG);
4784 Results.push_back(DAG.getNode(ISD::TRUNCATE, DL, MVT::i32, Tmp1));
4785 break;
4786 }
4787 case ISD::BSWAP: {
4788 SDValue Src = N->getOperand(0);
4789 assert((VT == MVT::i16 || VT == MVT::i32) &&
4790 "Unexpected custom legalization");
4791 MVT GRLenVT = Subtarget.getGRLenVT();
4792 SDValue NewSrc = DAG.getNode(ISD::ANY_EXTEND, DL, GRLenVT, Src);
4793 SDValue Tmp;
4794 switch (VT.getSizeInBits()) {
4795 default:
4796 llvm_unreachable("Unexpected operand width");
4797 case 16:
4798 Tmp = DAG.getNode(LoongArchISD::REVB_2H, DL, GRLenVT, NewSrc);
4799 break;
4800 case 32:
4801 // Only LA64 will get here, due to the size mismatch between VT and
4802 // GRLenVT; the LA32 lowering is defined directly in LoongArchInstrInfo.
4803 Tmp = DAG.getNode(LoongArchISD::REVB_2W, DL, GRLenVT, NewSrc);
4804 break;
4805 }
4806 Results.push_back(DAG.getNode(ISD::TRUNCATE, DL, VT, Tmp));
4807 break;
4808 }
4809 case ISD::BITREVERSE: {
4810 SDValue Src = N->getOperand(0);
4811 assert((VT == MVT::i8 || (VT == MVT::i32 && Subtarget.is64Bit())) &&
4812 "Unexpected custom legalization");
4813 MVT GRLenVT = Subtarget.getGRLenVT();
4814 SDValue NewSrc = DAG.getNode(ISD::ANY_EXTEND, DL, GRLenVT, Src);
4815 SDValue Tmp;
4816 switch (VT.getSizeInBits()) {
4817 default:
4818 llvm_unreachable("Unexpected operand width");
4819 case 8:
4820 Tmp = DAG.getNode(LoongArchISD::BITREV_4B, DL, GRLenVT, NewSrc);
4821 break;
4822 case 32:
4823 Tmp = DAG.getNode(LoongArchISD::BITREV_W, DL, GRLenVT, NewSrc);
4824 break;
4825 }
4826 Results.push_back(DAG.getNode(ISD::TRUNCATE, DL, VT, Tmp));
4827 break;
4828 }
4829 case ISD::CTLZ:
4830 case ISD::CTTZ: {
4831 assert(VT == MVT::i32 && Subtarget.is64Bit() &&
4832 "Unexpected custom legalisation");
4833 Results.push_back(customLegalizeToWOp(N, DAG, 1));
4834 break;
4835 }
4836 case ISD::INTRINSIC_W_CHAIN: {
4837 SDValue Chain = N->getOperand(0);
4838 SDValue Op2 = N->getOperand(2);
4839 MVT GRLenVT = Subtarget.getGRLenVT();
4840 const StringRef ErrorMsgOOR = "argument out of range";
4841 const StringRef ErrorMsgReqLA64 = "requires loongarch64";
4842 const StringRef ErrorMsgReqF = "requires basic 'f' target feature";
4843
4844 switch (N->getConstantOperandVal(1)) {
4845 default:
4846 llvm_unreachable("Unexpected Intrinsic.");
4847 case Intrinsic::loongarch_movfcsr2gr: {
4848 if (!Subtarget.hasBasicF()) {
4849 emitErrorAndReplaceIntrinsicResults(N, Results, DAG, ErrorMsgReqF);
4850 return;
4851 }
4852 unsigned Imm = Op2->getAsZExtVal();
4853 if (!isUInt<2>(Imm)) {
4854 emitErrorAndReplaceIntrinsicResults(N, Results, DAG, ErrorMsgOOR);
4855 return;
4856 }
4857 SDValue MOVFCSR2GRResults = DAG.getNode(
4858 LoongArchISD::MOVFCSR2GR, SDLoc(N), {MVT::i64, MVT::Other},
4859 {Chain, DAG.getConstant(Imm, DL, GRLenVT)});
4860 Results.push_back(
4861 DAG.getNode(ISD::TRUNCATE, DL, VT, MOVFCSR2GRResults.getValue(0)));
4862 Results.push_back(MOVFCSR2GRResults.getValue(1));
4863 break;
4864 }
4865#define CRC_CASE_EXT_BINARYOP(NAME, NODE) \
4866 case Intrinsic::loongarch_##NAME: { \
4867 SDValue NODE = DAG.getNode( \
4868 LoongArchISD::NODE, DL, {MVT::i64, MVT::Other}, \
4869 {Chain, DAG.getNode(ISD::ANY_EXTEND, DL, MVT::i64, Op2), \
4870 DAG.getNode(ISD::ANY_EXTEND, DL, MVT::i64, N->getOperand(3))}); \
4871 Results.push_back(DAG.getNode(ISD::TRUNCATE, DL, VT, NODE.getValue(0))); \
4872 Results.push_back(NODE.getValue(1)); \
4873 break; \
4874 }
4875 CRC_CASE_EXT_BINARYOP(crc_w_b_w, CRC_W_B_W)
4876 CRC_CASE_EXT_BINARYOP(crc_w_h_w, CRC_W_H_W)
4877 CRC_CASE_EXT_BINARYOP(crc_w_w_w, CRC_W_W_W)
4878 CRC_CASE_EXT_BINARYOP(crcc_w_b_w, CRCC_W_B_W)
4879 CRC_CASE_EXT_BINARYOP(crcc_w_h_w, CRCC_W_H_W)
4880 CRC_CASE_EXT_BINARYOP(crcc_w_w_w, CRCC_W_W_W)
4881#undef CRC_CASE_EXT_BINARYOP
4882
4883#define CRC_CASE_EXT_UNARYOP(NAME, NODE) \
4884 case Intrinsic::loongarch_##NAME: { \
4885 SDValue NODE = DAG.getNode( \
4886 LoongArchISD::NODE, DL, {MVT::i64, MVT::Other}, \
4887 {Chain, Op2, \
4888 DAG.getNode(ISD::ANY_EXTEND, DL, MVT::i64, N->getOperand(3))}); \
4889 Results.push_back(DAG.getNode(ISD::TRUNCATE, DL, VT, NODE.getValue(0))); \
4890 Results.push_back(NODE.getValue(1)); \
4891 break; \
4892 }
4893 CRC_CASE_EXT_UNARYOP(crc_w_d_w, CRC_W_D_W)
4894 CRC_CASE_EXT_UNARYOP(crcc_w_d_w, CRCC_W_D_W)
4895#undef CRC_CASE_EXT_UNARYOP
4896#define CSR_CASE(ID) \
4897 case Intrinsic::loongarch_##ID: { \
4898 if (!Subtarget.is64Bit()) \
4899 emitErrorAndReplaceIntrinsicResults(N, Results, DAG, ErrorMsgReqLA64); \
4900 break; \
4901 }
4902 CSR_CASE(csrrd_d);
4903 CSR_CASE(csrwr_d);
4904 CSR_CASE(csrxchg_d);
4905 CSR_CASE(iocsrrd_d);
4906#undef CSR_CASE
4907 case Intrinsic::loongarch_csrrd_w: {
4908 unsigned Imm = Op2->getAsZExtVal();
4909 if (!isUInt<14>(Imm)) {
4910 emitErrorAndReplaceIntrinsicResults(N, Results, DAG, ErrorMsgOOR);
4911 return;
4912 }
4913 SDValue CSRRDResults =
4914 DAG.getNode(LoongArchISD::CSRRD, DL, {GRLenVT, MVT::Other},
4915 {Chain, DAG.getConstant(Imm, DL, GRLenVT)});
4916 Results.push_back(
4917 DAG.getNode(ISD::TRUNCATE, DL, VT, CSRRDResults.getValue(0)));
4918 Results.push_back(CSRRDResults.getValue(1));
4919 break;
4920 }
4921 case Intrinsic::loongarch_csrwr_w: {
4922 unsigned Imm = N->getConstantOperandVal(3);
4923 if (!isUInt<14>(Imm)) {
4924 emitErrorAndReplaceIntrinsicResults(N, Results, DAG, ErrorMsgOOR);
4925 return;
4926 }
4927 SDValue CSRWRResults =
4928 DAG.getNode(LoongArchISD::CSRWR, DL, {GRLenVT, MVT::Other},
4929 {Chain, DAG.getNode(ISD::ANY_EXTEND, DL, MVT::i64, Op2),
4930 DAG.getConstant(Imm, DL, GRLenVT)});
4931 Results.push_back(
4932 DAG.getNode(ISD::TRUNCATE, DL, VT, CSRWRResults.getValue(0)));
4933 Results.push_back(CSRWRResults.getValue(1));
4934 break;
4935 }
4936 case Intrinsic::loongarch_csrxchg_w: {
4937 unsigned Imm = N->getConstantOperandVal(4);
4938 if (!isUInt<14>(Imm)) {
4939 emitErrorAndReplaceIntrinsicResults(N, Results, DAG, ErrorMsgOOR);
4940 return;
4941 }
4942 SDValue CSRXCHGResults = DAG.getNode(
4943 LoongArchISD::CSRXCHG, DL, {GRLenVT, MVT::Other},
4944 {Chain, DAG.getNode(ISD::ANY_EXTEND, DL, MVT::i64, Op2),
4945 DAG.getNode(ISD::ANY_EXTEND, DL, MVT::i64, N->getOperand(3)),
4946 DAG.getConstant(Imm, DL, GRLenVT)});
4947 Results.push_back(
4948 DAG.getNode(ISD::TRUNCATE, DL, VT, CSRXCHGResults.getValue(0)));
4949 Results.push_back(CSRXCHGResults.getValue(1));
4950 break;
4951 }
4952#define IOCSRRD_CASE(NAME, NODE) \
4953 case Intrinsic::loongarch_##NAME: { \
4954 SDValue IOCSRRDResults = \
4955 DAG.getNode(LoongArchISD::NODE, DL, {MVT::i64, MVT::Other}, \
4956 {Chain, DAG.getNode(ISD::ANY_EXTEND, DL, MVT::i64, Op2)}); \
4957 Results.push_back( \
4958 DAG.getNode(ISD::TRUNCATE, DL, VT, IOCSRRDResults.getValue(0))); \
4959 Results.push_back(IOCSRRDResults.getValue(1)); \
4960 break; \
4961 }
4962 IOCSRRD_CASE(iocsrrd_b, IOCSRRD_B);
4963 IOCSRRD_CASE(iocsrrd_h, IOCSRRD_H);
4964 IOCSRRD_CASE(iocsrrd_w, IOCSRRD_W);
4965#undef IOCSRRD_CASE
4966 case Intrinsic::loongarch_cpucfg: {
4967 SDValue CPUCFGResults =
4968 DAG.getNode(LoongArchISD::CPUCFG, DL, {GRLenVT, MVT::Other},
4969 {Chain, DAG.getNode(ISD::ANY_EXTEND, DL, MVT::i64, Op2)});
4970 Results.push_back(
4971 DAG.getNode(ISD::TRUNCATE, DL, VT, CPUCFGResults.getValue(0)));
4972 Results.push_back(CPUCFGResults.getValue(1));
4973 break;
4974 }
4975 case Intrinsic::loongarch_lddir_d: {
4976 if (!Subtarget.is64Bit()) {
4977 emitErrorAndReplaceIntrinsicResults(N, Results, DAG, ErrorMsgReqLA64);
4978 return;
4979 }
4980 break;
4981 }
4982 }
4983 break;
4984 }
4985 case ISD::READ_REGISTER: {
4986 if (Subtarget.is64Bit())
4987 DAG.getContext()->emitError(
4988 "On LA64, only 64-bit registers can be read.");
4989 else
4990 DAG.getContext()->emitError(
4991 "On LA32, only 32-bit registers can be read.");
4992 Results.push_back(DAG.getUNDEF(VT));
4993 Results.push_back(N->getOperand(0));
4994 break;
4995 }
 4996  case ISD::INTRINSIC_WO_CHAIN: {
 4997    replaceINTRINSIC_WO_CHAINResults(N, Results, DAG, Subtarget);
4998 break;
4999 }
5000 case ISD::LROUND: {
5001 SDValue Op0 = N->getOperand(0);
5002 EVT OpVT = Op0.getValueType();
5003 RTLIB::Libcall LC =
5004 OpVT == MVT::f64 ? RTLIB::LROUND_F64 : RTLIB::LROUND_F32;
5005 MakeLibCallOptions CallOptions;
5006 CallOptions.setTypeListBeforeSoften(OpVT, MVT::i64);
5007 SDValue Result = makeLibCall(DAG, LC, MVT::i64, Op0, CallOptions, DL).first;
5008 Result = DAG.getNode(ISD::TRUNCATE, DL, MVT::i32, Result);
5009 Results.push_back(Result);
5010 break;
5011 }
5012 case ISD::ATOMIC_CMP_SWAP: {
 5013    replaceCMP_XCHG_128Results(N, Results, DAG);
 5014    break;
5015 }
5016 case ISD::TRUNCATE: {
5017 MVT VT = N->getSimpleValueType(0);
5018 if (getTypeAction(*DAG.getContext(), VT) != TypeWidenVector)
5019 return;
5020
5021 MVT WidenVT = getTypeToTransformTo(*DAG.getContext(), VT).getSimpleVT();
5022 SDValue In = N->getOperand(0);
5023 EVT InVT = In.getValueType();
5024 EVT InEltVT = InVT.getVectorElementType();
5025 EVT EltVT = VT.getVectorElementType();
5026 unsigned MinElts = VT.getVectorNumElements();
5027 unsigned WidenNumElts = WidenVT.getVectorNumElements();
5028 unsigned InBits = InVT.getSizeInBits();
5029
5030 if ((128 % InBits) == 0 && WidenVT.is128BitVector()) {
5031 if ((InEltVT.getSizeInBits() % EltVT.getSizeInBits()) == 0) {
5032 int Scale = InEltVT.getSizeInBits() / EltVT.getSizeInBits();
5033 SmallVector<int, 16> TruncMask(WidenNumElts, -1);
5034 for (unsigned I = 0; I < MinElts; ++I)
5035 TruncMask[I] = Scale * I;
5036
5037 unsigned WidenNumElts = 128 / In.getScalarValueSizeInBits();
5038 MVT SVT = In.getSimpleValueType().getScalarType();
5039 MVT VT = MVT::getVectorVT(SVT, WidenNumElts);
5040 SDValue WidenIn =
5041 DAG.getNode(ISD::INSERT_SUBVECTOR, DL, VT, DAG.getUNDEF(VT), In,
5042 DAG.getVectorIdxConstant(0, DL));
5043 assert(isTypeLegal(WidenVT) && isTypeLegal(WidenIn.getValueType()) &&
5044 "Illegal vector type in truncation");
5045 WidenIn = DAG.getBitcast(WidenVT, WidenIn);
5046 Results.push_back(
5047 DAG.getVectorShuffle(WidenVT, DL, WidenIn, WidenIn, TruncMask));
5048 return;
5049 }
5050 }
5051
5052 break;
5053 }
5054 }
5055}
5056
5057static SDValue performANDCombine(SDNode *N, SelectionDAG &DAG,
5058 TargetLowering::DAGCombinerInfo &DCI,
5059 const LoongArchSubtarget &Subtarget) {
5060 if (DCI.isBeforeLegalizeOps())
5061 return SDValue();
5062
5063 SDValue FirstOperand = N->getOperand(0);
5064 SDValue SecondOperand = N->getOperand(1);
5065 unsigned FirstOperandOpc = FirstOperand.getOpcode();
5066 EVT ValTy = N->getValueType(0);
5067 SDLoc DL(N);
5068 uint64_t lsb, msb;
5069 unsigned SMIdx, SMLen;
5070 ConstantSDNode *CN;
5071 SDValue NewOperand;
5072 MVT GRLenVT = Subtarget.getGRLenVT();
5073
5074 // BSTRPICK requires the 32S feature.
5075 if (!Subtarget.has32S())
5076 return SDValue();
5077
5078 // Op's second operand must be a shifted mask.
5079 if (!(CN = dyn_cast<ConstantSDNode>(SecondOperand)) ||
5080 !isShiftedMask_64(CN->getZExtValue(), SMIdx, SMLen))
5081 return SDValue();
5082
5083 if (FirstOperandOpc == ISD::SRA || FirstOperandOpc == ISD::SRL) {
5084 // Pattern match BSTRPICK.
5085 // $dst = and ((sra or srl) $src , lsb), (2**len - 1)
5086 // => BSTRPICK $dst, $src, msb, lsb
5087 // where msb = lsb + len - 1
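    //  For example, (and (srl $src, 8), 0xff) extracts bits [15:8] of $src:
    //  lsb = 8, len = 8, so it becomes (BSTRPICK $src, 15, 8).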
5088
5089 // The second operand of the shift must be an immediate.
5090 if (!(CN = dyn_cast<ConstantSDNode>(FirstOperand.getOperand(1))))
5091 return SDValue();
5092
5093 lsb = CN->getZExtValue();
5094
5095 // Return if the shifted mask does not start at bit 0 or the sum of its
5096 // length and lsb exceeds the word's size.
5097 if (SMIdx != 0 || lsb + SMLen > ValTy.getSizeInBits())
5098 return SDValue();
5099
5100 NewOperand = FirstOperand.getOperand(0);
5101 } else {
5102 // Pattern match BSTRPICK.
 5103    //  $dst = and $src, (2**len - 1), if len > 12
5104 // => BSTRPICK $dst, $src, msb, lsb
5105 // where lsb = 0 and msb = len - 1
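    //  For example, (and $src, 0xffff) has len = 16 > 12 and becomes
    //  (BSTRPICK $src, 15, 0); masks of 0xfff or less are left for ANDI.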
5106
5107 // If the mask is <= 0xfff, andi can be used instead.
5108 if (CN->getZExtValue() <= 0xfff)
5109 return SDValue();
5110
 5111    // Return if the mask extends beyond the value's bit width.
5112 if (SMIdx + SMLen > ValTy.getSizeInBits())
5113 return SDValue();
5114
5115 if (SMIdx > 0) {
 5116      // Omit if the constant has more than 2 uses. This is a conservative
5117 // decision. Whether it is a win depends on the HW microarchitecture.
5118 // However it should always be better for 1 and 2 uses.
5119 if (CN->use_size() > 2)
5120 return SDValue();
5121 // Return if the constant can be composed by a single LU12I.W.
5122 if ((CN->getZExtValue() & 0xfff) == 0)
5123 return SDValue();
 5124      // Return if the constant can be composed by a single ADDI with
5125 // the zero register.
5126 if (CN->getSExtValue() >= -2048 && CN->getSExtValue() < 0)
5127 return SDValue();
5128 }
5129
5130 lsb = SMIdx;
5131 NewOperand = FirstOperand;
5132 }
5133
5134 msb = lsb + SMLen - 1;
5135 SDValue NR0 = DAG.getNode(LoongArchISD::BSTRPICK, DL, ValTy, NewOperand,
5136 DAG.getConstant(msb, DL, GRLenVT),
5137 DAG.getConstant(lsb, DL, GRLenVT));
5138 if (FirstOperandOpc == ISD::SRA || FirstOperandOpc == ISD::SRL || lsb == 0)
5139 return NR0;
5140 // Try to optimize to
5141 // bstrpick $Rd, $Rs, msb, lsb
5142 // slli $Rd, $Rd, lsb
5143 return DAG.getNode(ISD::SHL, DL, ValTy, NR0,
5144 DAG.getConstant(lsb, DL, GRLenVT));
5145}
5146
5147static SDValue performSRLCombine(SDNode *N, SelectionDAG &DAG,
5148 TargetLowering::DAGCombinerInfo &DCI,
5149 const LoongArchSubtarget &Subtarget) {
5150 // BSTRPICK requires the 32S feature.
5151 if (!Subtarget.has32S())
5152 return SDValue();
5153
5154 if (DCI.isBeforeLegalizeOps())
5155 return SDValue();
5156
5157 // $dst = srl (and $src, Mask), Shamt
5158 // =>
5159 // BSTRPICK $dst, $src, MaskIdx+MaskLen-1, Shamt
5160 // when Mask is a shifted mask, and MaskIdx <= Shamt <= MaskIdx+MaskLen-1
5161 //
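  //  For example, with Mask = 0xff00 (MaskIdx = 8, MaskLen = 8) and Shamt = 12,
  //  (srl (and $src, 0xff00), 12) keeps bits [15:12] of $src and becomes
  //  (BSTRPICK $src, 15, 12).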
5162
5163 SDValue FirstOperand = N->getOperand(0);
5164 ConstantSDNode *CN;
5165 EVT ValTy = N->getValueType(0);
5166 SDLoc DL(N);
5167 MVT GRLenVT = Subtarget.getGRLenVT();
5168 unsigned MaskIdx, MaskLen;
5169 uint64_t Shamt;
5170
5171 // The first operand must be an AND and the second operand of the AND must be
5172 // a shifted mask.
5173 if (FirstOperand.getOpcode() != ISD::AND ||
5174 !(CN = dyn_cast<ConstantSDNode>(FirstOperand.getOperand(1))) ||
5175 !isShiftedMask_64(CN->getZExtValue(), MaskIdx, MaskLen))
5176 return SDValue();
5177
5178 // The second operand (shift amount) must be an immediate.
5179 if (!(CN = dyn_cast<ConstantSDNode>(N->getOperand(1))))
5180 return SDValue();
5181
5182 Shamt = CN->getZExtValue();
5183 if (MaskIdx <= Shamt && Shamt <= MaskIdx + MaskLen - 1)
5184 return DAG.getNode(LoongArchISD::BSTRPICK, DL, ValTy,
5185 FirstOperand->getOperand(0),
5186 DAG.getConstant(MaskIdx + MaskLen - 1, DL, GRLenVT),
5187 DAG.getConstant(Shamt, DL, GRLenVT));
5188
5189 return SDValue();
5190}
5191
5192// Helper to peek through bitops/trunc/setcc to determine size of source vector.
5193// Allows BITCASTCombine to determine what size vector generated a <X x i1>.
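// For example, a v8i1 produced by (setcc v8i32, v8i32, cc) reports a 256-bit
// source, while one produced by (setcc v8i16, v8i16, cc) reports 128 bits.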
5194static bool checkBitcastSrcVectorSize(SDValue Src, unsigned Size,
5195 unsigned Depth) {
5196 // Limit recursion.
 5197  if (Depth >= SelectionDAG::MaxRecursionDepth)
 5198    return false;
5199 switch (Src.getOpcode()) {
5200 case ISD::SETCC:
5201 case ISD::TRUNCATE:
5202 return Src.getOperand(0).getValueSizeInBits() == Size;
5203 case ISD::FREEZE:
5204 return checkBitcastSrcVectorSize(Src.getOperand(0), Size, Depth + 1);
5205 case ISD::AND:
5206 case ISD::XOR:
5207 case ISD::OR:
5208 return checkBitcastSrcVectorSize(Src.getOperand(0), Size, Depth + 1) &&
5209 checkBitcastSrcVectorSize(Src.getOperand(1), Size, Depth + 1);
5210 case ISD::SELECT:
5211 case ISD::VSELECT:
5212 return Src.getOperand(0).getScalarValueSizeInBits() == 1 &&
5213 checkBitcastSrcVectorSize(Src.getOperand(1), Size, Depth + 1) &&
5214 checkBitcastSrcVectorSize(Src.getOperand(2), Size, Depth + 1);
5215 case ISD::BUILD_VECTOR:
5216 return ISD::isBuildVectorAllZeros(Src.getNode()) ||
5217 ISD::isBuildVectorAllOnes(Src.getNode());
5218 }
5219 return false;
5220}
5221
5222// Helper to push sign extension of vXi1 SETCC result through bitops.
5223static SDValue signExtendBitcastSrcVector(SelectionDAG &DAG, EVT SExtVT,
5224 SDValue Src, const SDLoc &DL) {
5225 switch (Src.getOpcode()) {
5226 case ISD::SETCC:
5227 case ISD::FREEZE:
5228 case ISD::TRUNCATE:
5229 case ISD::BUILD_VECTOR:
5230 return DAG.getNode(ISD::SIGN_EXTEND, DL, SExtVT, Src);
5231 case ISD::AND:
5232 case ISD::XOR:
5233 case ISD::OR:
5234 return DAG.getNode(
5235 Src.getOpcode(), DL, SExtVT,
5236 signExtendBitcastSrcVector(DAG, SExtVT, Src.getOperand(0), DL),
5237 signExtendBitcastSrcVector(DAG, SExtVT, Src.getOperand(1), DL));
5238 case ISD::SELECT:
5239 case ISD::VSELECT:
5240 return DAG.getSelect(
5241 DL, SExtVT, Src.getOperand(0),
5242 signExtendBitcastSrcVector(DAG, SExtVT, Src.getOperand(1), DL),
5243 signExtendBitcastSrcVector(DAG, SExtVT, Src.getOperand(2), DL));
5244 }
5245 llvm_unreachable("Unexpected node type for vXi1 sign extension");
5246}
5247
5248static SDValue
5249performSETCC_BITCASTCombine(SDNode *N, SelectionDAG &DAG,
5250 TargetLowering::DAGCombinerInfo &DCI,
5251 const LoongArchSubtarget &Subtarget) {
5252 SDLoc DL(N);
5253 EVT VT = N->getValueType(0);
5254 SDValue Src = N->getOperand(0);
5255 EVT SrcVT = Src.getValueType();
5256
5257 if (Src.getOpcode() != ISD::SETCC || !Src.hasOneUse())
5258 return SDValue();
5259
5260 bool UseLASX;
5261 unsigned Opc = ISD::DELETED_NODE;
5262 EVT CmpVT = Src.getOperand(0).getValueType();
5263 EVT EltVT = CmpVT.getVectorElementType();
5264
5265 if (Subtarget.hasExtLSX() && CmpVT.getSizeInBits() == 128)
5266 UseLASX = false;
5267 else if (Subtarget.has32S() && Subtarget.hasExtLASX() &&
5268 CmpVT.getSizeInBits() == 256)
5269 UseLASX = true;
5270 else
5271 return SDValue();
5272
5273 SDValue SrcN1 = Src.getOperand(1);
5274 switch (cast<CondCodeSDNode>(Src.getOperand(2))->get()) {
5275 default:
5276 break;
5277 case ISD::SETEQ:
5278 // x == 0 => not (vmsknez.b x)
5279 if (ISD::isBuildVectorAllZeros(SrcN1.getNode()) && EltVT == MVT::i8)
 5280      Opc = UseLASX ? LoongArchISD::XVMSKEQZ : LoongArchISD::VMSKEQZ;
 5281    break;
5282 case ISD::SETGT:
5283 // x > -1 => vmskgez.b x
5284 if (ISD::isBuildVectorAllOnes(SrcN1.getNode()) && EltVT == MVT::i8)
 5285      Opc = UseLASX ? LoongArchISD::XVMSKGEZ : LoongArchISD::VMSKGEZ;
 5286    break;
5287 case ISD::SETGE:
5288 // x >= 0 => vmskgez.b x
5289 if (ISD::isBuildVectorAllZeros(SrcN1.getNode()) && EltVT == MVT::i8)
 5290      Opc = UseLASX ? LoongArchISD::XVMSKGEZ : LoongArchISD::VMSKGEZ;
 5291    break;
5292 case ISD::SETLT:
5293 // x < 0 => vmskltz.{b,h,w,d} x
5294 if (ISD::isBuildVectorAllZeros(SrcN1.getNode()) &&
5295 (EltVT == MVT::i8 || EltVT == MVT::i16 || EltVT == MVT::i32 ||
5296 EltVT == MVT::i64))
 5297      Opc = UseLASX ? LoongArchISD::XVMSKLTZ : LoongArchISD::VMSKLTZ;
 5298    break;
5299 case ISD::SETLE:
5300 // x <= -1 => vmskltz.{b,h,w,d} x
5301 if (ISD::isBuildVectorAllOnes(SrcN1.getNode()) &&
5302 (EltVT == MVT::i8 || EltVT == MVT::i16 || EltVT == MVT::i32 ||
5303 EltVT == MVT::i64))
 5304      Opc = UseLASX ? LoongArchISD::XVMSKLTZ : LoongArchISD::VMSKLTZ;
 5305    break;
5306 case ISD::SETNE:
5307 // x != 0 => vmsknez.b x
5308 if (ISD::isBuildVectorAllZeros(SrcN1.getNode()) && EltVT == MVT::i8)
 5309      Opc = UseLASX ? LoongArchISD::XVMSKNEZ : LoongArchISD::VMSKNEZ;
 5310    break;
5311 }
5312
5313 if (Opc == ISD::DELETED_NODE)
5314 return SDValue();
5315
5316 SDValue V = DAG.getNode(Opc, DL, Subtarget.getGRLenVT(), Src.getOperand(0));
 5317  EVT T = EVT::getIntegerVT(*DAG.getContext(), SrcVT.getVectorNumElements());
 5318  V = DAG.getZExtOrTrunc(V, DL, T);
5319 return DAG.getBitcast(VT, V);
5320}
5321
5322static SDValue performBITCASTCombine(SDNode *N, SelectionDAG &DAG,
5323 TargetLowering::DAGCombinerInfo &DCI,
5324 const LoongArchSubtarget &Subtarget) {
5325 SDLoc DL(N);
5326 EVT VT = N->getValueType(0);
5327 SDValue Src = N->getOperand(0);
5328 EVT SrcVT = Src.getValueType();
5329 MVT GRLenVT = Subtarget.getGRLenVT();
5330
5331 if (!DCI.isBeforeLegalizeOps())
5332 return SDValue();
5333
5334 if (!SrcVT.isSimple() || SrcVT.getScalarType() != MVT::i1)
5335 return SDValue();
5336
5337 // Combine SETCC and BITCAST into [X]VMSK{LT,GE,NE} when possible
5338 SDValue Res = performSETCC_BITCASTCombine(N, DAG, DCI, Subtarget);
5339 if (Res)
5340 return Res;
5341
5342 // Generate vXi1 using [X]VMSKLTZ
5343 MVT SExtVT;
5344 unsigned Opc;
5345 bool UseLASX = false;
5346 bool PropagateSExt = false;
5347
5348 if (Src.getOpcode() == ISD::SETCC && Src.hasOneUse()) {
5349 EVT CmpVT = Src.getOperand(0).getValueType();
5350 if (CmpVT.getSizeInBits() > 256)
5351 return SDValue();
5352 }
5353
5354 switch (SrcVT.getSimpleVT().SimpleTy) {
5355 default:
5356 return SDValue();
5357 case MVT::v2i1:
5358 SExtVT = MVT::v2i64;
5359 break;
5360 case MVT::v4i1:
5361 SExtVT = MVT::v4i32;
5362 if (Subtarget.hasExtLASX() && checkBitcastSrcVectorSize(Src, 256, 0)) {
5363 SExtVT = MVT::v4i64;
5364 UseLASX = true;
5365 PropagateSExt = true;
5366 }
5367 break;
5368 case MVT::v8i1:
5369 SExtVT = MVT::v8i16;
5370 if (Subtarget.hasExtLASX() && checkBitcastSrcVectorSize(Src, 256, 0)) {
5371 SExtVT = MVT::v8i32;
5372 UseLASX = true;
5373 PropagateSExt = true;
5374 }
5375 break;
5376 case MVT::v16i1:
5377 SExtVT = MVT::v16i8;
5378 if (Subtarget.hasExtLASX() && checkBitcastSrcVectorSize(Src, 256, 0)) {
5379 SExtVT = MVT::v16i16;
5380 UseLASX = true;
5381 PropagateSExt = true;
5382 }
5383 break;
5384 case MVT::v32i1:
5385 SExtVT = MVT::v32i8;
5386 UseLASX = true;
5387 break;
5388 };
5389 Src = PropagateSExt ? signExtendBitcastSrcVector(DAG, SExtVT, Src, DL)
5390 : DAG.getNode(ISD::SIGN_EXTEND, DL, SExtVT, Src);
5391
5392 SDValue V;
5393 if (!Subtarget.has32S() || !Subtarget.hasExtLASX()) {
5394 if (Src.getSimpleValueType() == MVT::v32i8) {
5395 SDValue Lo, Hi;
5396 std::tie(Lo, Hi) = DAG.SplitVector(Src, DL);
5397 Lo = DAG.getNode(LoongArchISD::VMSKLTZ, DL, GRLenVT, Lo);
5398 Hi = DAG.getNode(LoongArchISD::VMSKLTZ, DL, GRLenVT, Hi);
5399 Hi = DAG.getNode(ISD::SHL, DL, GRLenVT, Hi,
5400 DAG.getConstant(16, DL, MVT::i8));
5401 V = DAG.getNode(ISD::OR, DL, GRLenVT, Lo, Hi);
5402 } else if (UseLASX) {
5403 return SDValue();
5404 }
5405 }
5406
5407 if (!V) {
 5408    Opc = UseLASX ? LoongArchISD::XVMSKLTZ : LoongArchISD::VMSKLTZ;
 5409    V = DAG.getNode(Opc, DL, GRLenVT, Src);
5410 }
5411
 5412  EVT T = EVT::getIntegerVT(*DAG.getContext(), SrcVT.getVectorNumElements());
 5413  V = DAG.getZExtOrTrunc(V, DL, T);
5414 return DAG.getBitcast(VT, V);
5415}
5416
5417static SDValue performORCombine(SDNode *N, SelectionDAG &DAG,
5418 TargetLowering::DAGCombinerInfo &DCI,
5419 const LoongArchSubtarget &Subtarget) {
5420 MVT GRLenVT = Subtarget.getGRLenVT();
5421 EVT ValTy = N->getValueType(0);
5422 SDValue N0 = N->getOperand(0), N1 = N->getOperand(1);
5423 ConstantSDNode *CN0, *CN1;
5424 SDLoc DL(N);
5425 unsigned ValBits = ValTy.getSizeInBits();
5426 unsigned MaskIdx0, MaskLen0, MaskIdx1, MaskLen1;
5427 unsigned Shamt;
5428 bool SwapAndRetried = false;
5429
5430 // BSTRPICK requires the 32S feature.
5431 if (!Subtarget.has32S())
5432 return SDValue();
5433
5434 if (DCI.isBeforeLegalizeOps())
5435 return SDValue();
5436
5437 if (ValBits != 32 && ValBits != 64)
5438 return SDValue();
5439
5440Retry:
5441 // 1st pattern to match BSTRINS:
5442 // R = or (and X, mask0), (and (shl Y, lsb), mask1)
5443 // where mask1 = (2**size - 1) << lsb, mask0 = ~mask1
5444 // =>
5445 // R = BSTRINS X, Y, msb, lsb (where msb = lsb + size - 1)
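  //  For example, with size = 8 and lsb = 8 (mask1 = 0xff00, mask0 = ~0xff00),
  //  (or (and X, ~0xff00), (and (shl Y, 8), 0xff00)) inserts the low 8 bits of
  //  Y into bits [15:8] of X, i.e. (BSTRINS X, Y, 15, 8).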
5446 if (N0.getOpcode() == ISD::AND &&
5447 (CN0 = dyn_cast<ConstantSDNode>(N0.getOperand(1))) &&
5448 isShiftedMask_64(~CN0->getSExtValue(), MaskIdx0, MaskLen0) &&
5449 N1.getOpcode() == ISD::AND && N1.getOperand(0).getOpcode() == ISD::SHL &&
5450 (CN1 = dyn_cast<ConstantSDNode>(N1.getOperand(1))) &&
5451 isShiftedMask_64(CN1->getZExtValue(), MaskIdx1, MaskLen1) &&
5452 MaskIdx0 == MaskIdx1 && MaskLen0 == MaskLen1 &&
5453 (CN1 = dyn_cast<ConstantSDNode>(N1.getOperand(0).getOperand(1))) &&
5454 (Shamt = CN1->getZExtValue()) == MaskIdx0 &&
5455 (MaskIdx0 + MaskLen0 <= ValBits)) {
5456 LLVM_DEBUG(dbgs() << "Perform OR combine: match pattern 1\n");
5457 return DAG.getNode(LoongArchISD::BSTRINS, DL, ValTy, N0.getOperand(0),
5458 N1.getOperand(0).getOperand(0),
5459 DAG.getConstant((MaskIdx0 + MaskLen0 - 1), DL, GRLenVT),
5460 DAG.getConstant(MaskIdx0, DL, GRLenVT));
5461 }
5462
5463 // 2nd pattern to match BSTRINS:
5464 // R = or (and X, mask0), (shl (and Y, mask1), lsb)
5465 // where mask1 = (2**size - 1), mask0 = ~(mask1 << lsb)
5466 // =>
5467 // R = BSTRINS X, Y, msb, lsb (where msb = lsb + size - 1)
5468 if (N0.getOpcode() == ISD::AND &&
5469 (CN0 = dyn_cast<ConstantSDNode>(N0.getOperand(1))) &&
5470 isShiftedMask_64(~CN0->getSExtValue(), MaskIdx0, MaskLen0) &&
5471 N1.getOpcode() == ISD::SHL && N1.getOperand(0).getOpcode() == ISD::AND &&
5472 (CN1 = dyn_cast<ConstantSDNode>(N1.getOperand(1))) &&
5473 (Shamt = CN1->getZExtValue()) == MaskIdx0 &&
5474 (CN1 = dyn_cast<ConstantSDNode>(N1.getOperand(0).getOperand(1))) &&
5475 isShiftedMask_64(CN1->getZExtValue(), MaskIdx1, MaskLen1) &&
5476 MaskLen0 == MaskLen1 && MaskIdx1 == 0 &&
5477 (MaskIdx0 + MaskLen0 <= ValBits)) {
5478 LLVM_DEBUG(dbgs() << "Perform OR combine: match pattern 2\n");
5479 return DAG.getNode(LoongArchISD::BSTRINS, DL, ValTy, N0.getOperand(0),
5480 N1.getOperand(0).getOperand(0),
5481 DAG.getConstant((MaskIdx0 + MaskLen0 - 1), DL, GRLenVT),
5482 DAG.getConstant(MaskIdx0, DL, GRLenVT));
5483 }
5484
5485 // 3rd pattern to match BSTRINS:
5486 // R = or (and X, mask0), (and Y, mask1)
5487 // where ~mask0 = (2**size - 1) << lsb, mask0 & mask1 = 0
5488 // =>
5489 // R = BSTRINS X, (shr (and Y, mask1), lsb), msb, lsb
5490 // where msb = lsb + size - 1
5491 if (N0.getOpcode() == ISD::AND && N1.getOpcode() == ISD::AND &&
5492 (CN0 = dyn_cast<ConstantSDNode>(N0.getOperand(1))) &&
5493 isShiftedMask_64(~CN0->getSExtValue(), MaskIdx0, MaskLen0) &&
5494 (MaskIdx0 + MaskLen0 <= 64) &&
5495 (CN1 = dyn_cast<ConstantSDNode>(N1->getOperand(1))) &&
5496 (CN1->getSExtValue() & CN0->getSExtValue()) == 0) {
5497 LLVM_DEBUG(dbgs() << "Perform OR combine: match pattern 3\n");
5498 return DAG.getNode(LoongArchISD::BSTRINS, DL, ValTy, N0.getOperand(0),
5499 DAG.getNode(ISD::SRL, DL, N1->getValueType(0), N1,
5500 DAG.getConstant(MaskIdx0, DL, GRLenVT)),
5501 DAG.getConstant(ValBits == 32
5502 ? (MaskIdx0 + (MaskLen0 & 31) - 1)
5503 : (MaskIdx0 + MaskLen0 - 1),
5504 DL, GRLenVT),
5505 DAG.getConstant(MaskIdx0, DL, GRLenVT));
5506 }
5507
5508 // 4th pattern to match BSTRINS:
5509 // R = or (and X, mask), (shl Y, shamt)
5510 // where mask = (2**shamt - 1)
5511 // =>
5512 // R = BSTRINS X, Y, ValBits - 1, shamt
5513 // where ValBits = 32 or 64
5514 if (N0.getOpcode() == ISD::AND && N1.getOpcode() == ISD::SHL &&
5515 (CN0 = dyn_cast<ConstantSDNode>(N0.getOperand(1))) &&
5516 isShiftedMask_64(CN0->getZExtValue(), MaskIdx0, MaskLen0) &&
5517 MaskIdx0 == 0 && (CN1 = dyn_cast<ConstantSDNode>(N1.getOperand(1))) &&
5518 (Shamt = CN1->getZExtValue()) == MaskLen0 &&
5519 (MaskIdx0 + MaskLen0 <= ValBits)) {
5520 LLVM_DEBUG(dbgs() << "Perform OR combine: match pattern 4\n");
5521 return DAG.getNode(LoongArchISD::BSTRINS, DL, ValTy, N0.getOperand(0),
5522 N1.getOperand(0),
5523 DAG.getConstant((ValBits - 1), DL, GRLenVT),
5524 DAG.getConstant(Shamt, DL, GRLenVT));
5525 }
5526
5527 // 5th pattern to match BSTRINS:
5528 // R = or (and X, mask), const
5529 // where ~mask = (2**size - 1) << lsb, mask & const = 0
5530 // =>
5531 // R = BSTRINS X, (const >> lsb), msb, lsb
5532 // where msb = lsb + size - 1
5533 if (N0.getOpcode() == ISD::AND &&
5534 (CN0 = dyn_cast<ConstantSDNode>(N0.getOperand(1))) &&
5535 isShiftedMask_64(~CN0->getSExtValue(), MaskIdx0, MaskLen0) &&
5536 (CN1 = dyn_cast<ConstantSDNode>(N1)) &&
5537 (CN1->getSExtValue() & CN0->getSExtValue()) == 0) {
5538 LLVM_DEBUG(dbgs() << "Perform OR combine: match pattern 5\n");
5539 return DAG.getNode(
5540 LoongArchISD::BSTRINS, DL, ValTy, N0.getOperand(0),
5541 DAG.getSignedConstant(CN1->getSExtValue() >> MaskIdx0, DL, ValTy),
5542 DAG.getConstant(ValBits == 32 ? (MaskIdx0 + (MaskLen0 & 31) - 1)
5543 : (MaskIdx0 + MaskLen0 - 1),
5544 DL, GRLenVT),
5545 DAG.getConstant(MaskIdx0, DL, GRLenVT));
5546 }
5547
5548 // 6th pattern.
5549 // a = b | ((c & mask) << shamt), where all positions in b to be overwritten
5550 // by the incoming bits are known to be zero.
5551 // =>
5552 // a = BSTRINS b, c, shamt + MaskLen - 1, shamt
5553 //
5554 // Note that the 1st pattern is a special situation of the 6th, i.e. the 6th
5555 // pattern is more common than the 1st. So we put the 1st before the 6th in
5556 // order to match as many nodes as possible.
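  //  For example, with mask = 0xff (MaskLen = 8) and shamt = 16, if bits
  //  [23:16] of b are known to be zero, b | ((c & 0xff) << 16) becomes
  //  (BSTRINS b, c, 23, 16).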
5557 ConstantSDNode *CNMask, *CNShamt;
5558 unsigned MaskIdx, MaskLen;
5559 if (N1.getOpcode() == ISD::SHL && N1.getOperand(0).getOpcode() == ISD::AND &&
5560 (CNMask = dyn_cast<ConstantSDNode>(N1.getOperand(0).getOperand(1))) &&
5561 isShiftedMask_64(CNMask->getZExtValue(), MaskIdx, MaskLen) &&
5562 MaskIdx == 0 && (CNShamt = dyn_cast<ConstantSDNode>(N1.getOperand(1))) &&
5563 CNShamt->getZExtValue() + MaskLen <= ValBits) {
5564 Shamt = CNShamt->getZExtValue();
5565 APInt ShMask(ValBits, CNMask->getZExtValue() << Shamt);
5566 if (ShMask.isSubsetOf(DAG.computeKnownBits(N0).Zero)) {
5567 LLVM_DEBUG(dbgs() << "Perform OR combine: match pattern 6\n");
5568 return DAG.getNode(LoongArchISD::BSTRINS, DL, ValTy, N0,
5569 N1.getOperand(0).getOperand(0),
5570 DAG.getConstant(Shamt + MaskLen - 1, DL, GRLenVT),
5571 DAG.getConstant(Shamt, DL, GRLenVT));
5572 }
5573 }
5574
5575 // 7th pattern.
5576 // a = b | ((c << shamt) & shifted_mask), where all positions in b to be
5577 // overwritten by the incoming bits are known to be zero.
5578 // =>
5579 // a = BSTRINS b, c, MaskIdx + MaskLen - 1, MaskIdx
5580 //
5581 // Similarly, the 7th pattern is more common than the 2nd. So we put the 2nd
5582 // before the 7th in order to match as many nodes as possible.
5583 if (N1.getOpcode() == ISD::AND &&
5584 (CNMask = dyn_cast<ConstantSDNode>(N1.getOperand(1))) &&
5585 isShiftedMask_64(CNMask->getZExtValue(), MaskIdx, MaskLen) &&
5586 N1.getOperand(0).getOpcode() == ISD::SHL &&
5587 (CNShamt = dyn_cast<ConstantSDNode>(N1.getOperand(0).getOperand(1))) &&
5588 CNShamt->getZExtValue() == MaskIdx) {
5589 APInt ShMask(ValBits, CNMask->getZExtValue());
5590 if (ShMask.isSubsetOf(DAG.computeKnownBits(N0).Zero)) {
5591 LLVM_DEBUG(dbgs() << "Perform OR combine: match pattern 7\n");
5592 return DAG.getNode(LoongArchISD::BSTRINS, DL, ValTy, N0,
5593 N1.getOperand(0).getOperand(0),
5594 DAG.getConstant(MaskIdx + MaskLen - 1, DL, GRLenVT),
5595 DAG.getConstant(MaskIdx, DL, GRLenVT));
5596 }
5597 }
5598
5599 // (or a, b) and (or b, a) are equivalent, so swap the operands and retry.
5600 if (!SwapAndRetried) {
5601 std::swap(N0, N1);
5602 SwapAndRetried = true;
5603 goto Retry;
5604 }
5605
5606 SwapAndRetried = false;
5607Retry2:
5608 // 8th pattern.
5609 // a = b | (c & shifted_mask), where all positions in b to be overwritten by
5610 // the incoming bits are known to be zero.
5611 // =>
5612 // a = BSTRINS b, c >> MaskIdx, MaskIdx + MaskLen - 1, MaskIdx
5613 //
5614 // Similarly, the 8th pattern is more common than the 4th and 5th patterns. So
 5615  // we put it here in order to match as many nodes as possible or generate
 5616  // fewer instructions.
5617 if (N1.getOpcode() == ISD::AND &&
5618 (CNMask = dyn_cast<ConstantSDNode>(N1.getOperand(1))) &&
5619 isShiftedMask_64(CNMask->getZExtValue(), MaskIdx, MaskLen)) {
5620 APInt ShMask(ValBits, CNMask->getZExtValue());
5621 if (ShMask.isSubsetOf(DAG.computeKnownBits(N0).Zero)) {
5622 LLVM_DEBUG(dbgs() << "Perform OR combine: match pattern 8\n");
5623 return DAG.getNode(LoongArchISD::BSTRINS, DL, ValTy, N0,
5624 DAG.getNode(ISD::SRL, DL, N1->getValueType(0),
5625 N1->getOperand(0),
5626 DAG.getConstant(MaskIdx, DL, GRLenVT)),
5627 DAG.getConstant(MaskIdx + MaskLen - 1, DL, GRLenVT),
5628 DAG.getConstant(MaskIdx, DL, GRLenVT));
5629 }
5630 }
5631 // Swap N0/N1 and retry.
5632 if (!SwapAndRetried) {
5633 std::swap(N0, N1);
5634 SwapAndRetried = true;
5635 goto Retry2;
5636 }
5637
5638 return SDValue();
5639}
5640
5641static bool checkValueWidth(SDValue V, ISD::LoadExtType &ExtType) {
5642 ExtType = ISD::NON_EXTLOAD;
5643
5644 switch (V.getNode()->getOpcode()) {
5645 case ISD::LOAD: {
5646 LoadSDNode *LoadNode = cast<LoadSDNode>(V.getNode());
5647 if ((LoadNode->getMemoryVT() == MVT::i8) ||
5648 (LoadNode->getMemoryVT() == MVT::i16)) {
5649 ExtType = LoadNode->getExtensionType();
5650 return true;
5651 }
5652 return false;
5653 }
5654 case ISD::AssertSext: {
5655 VTSDNode *TypeNode = cast<VTSDNode>(V.getNode()->getOperand(1));
5656 if ((TypeNode->getVT() == MVT::i8) || (TypeNode->getVT() == MVT::i16)) {
5657 ExtType = ISD::SEXTLOAD;
5658 return true;
5659 }
5660 return false;
5661 }
5662 case ISD::AssertZext: {
5663 VTSDNode *TypeNode = cast<VTSDNode>(V.getNode()->getOperand(1));
5664 if ((TypeNode->getVT() == MVT::i8) || (TypeNode->getVT() == MVT::i16)) {
5665 ExtType = ISD::ZEXTLOAD;
5666 return true;
5667 }
5668 return false;
5669 }
5670 default:
5671 return false;
5672 }
5673
5674 return false;
5675}
5676
5677// Eliminate redundant truncation and zero-extension nodes.
5678// * Case 1:
5679// +------------+ +------------+ +------------+
5680// | Input1 | | Input2 | | CC |
5681// +------------+ +------------+ +------------+
5682// | | |
5683// V V +----+
5684// +------------+ +------------+ |
5685// | TRUNCATE | | TRUNCATE | |
5686// +------------+ +------------+ |
5687// | | |
5688// V V |
5689// +------------+ +------------+ |
5690// | ZERO_EXT | | ZERO_EXT | |
5691// +------------+ +------------+ |
5692// | | |
5693// | +-------------+ |
5694// V V | |
5695// +----------------+ | |
5696// | AND | | |
5697// +----------------+ | |
5698// | | |
5699// +---------------+ | |
5700// | | |
5701// V V V
5702// +-------------+
5703// | CMP |
5704// +-------------+
5705// * Case 2:
5706// +------------+ +------------+ +-------------+ +------------+ +------------+
5707// | Input1 | | Input2 | | Constant -1 | | Constant 0 | | CC |
5708// +------------+ +------------+ +-------------+ +------------+ +------------+
5709// | | | | |
5710// V | | | |
5711// +------------+ | | | |
5712// | XOR |<---------------------+ | |
5713// +------------+ | | |
5714// | | | |
5715// V V +---------------+ |
5716// +------------+ +------------+ | |
5717// | TRUNCATE | | TRUNCATE | | +-------------------------+
5718// +------------+ +------------+ | |
5719// | | | |
5720// V V | |
5721// +------------+ +------------+ | |
5722// | ZERO_EXT | | ZERO_EXT | | |
5723// +------------+ +------------+ | |
5724// | | | |
5725// V V | |
5726// +----------------+ | |
5727// | AND | | |
5728// +----------------+ | |
5729// | | |
5730// +---------------+ | |
5731// | | |
5732// V V V
5733// +-------------+
5734// | CMP |
5735// +-------------+
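// In both cases the values reaching the AND are i8/i16 (possibly extending)
// loads, so the TRUNCATE/ZERO_EXT pairs are redundant and the AND and the
// comparison can be rebuilt directly on the wider inputs.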
5736static SDValue performSETCCCombine(SDNode *N, SelectionDAG &DAG,
5737 TargetLowering::DAGCombinerInfo &DCI,
5738 const LoongArchSubtarget &Subtarget) {
5739 ISD::CondCode CC = cast<CondCodeSDNode>(N->getOperand(2))->get();
5740
5741 SDNode *AndNode = N->getOperand(0).getNode();
5742 if (AndNode->getOpcode() != ISD::AND)
5743 return SDValue();
5744
5745 SDValue AndInputValue2 = AndNode->getOperand(1);
5746 if (AndInputValue2.getOpcode() != ISD::ZERO_EXTEND)
5747 return SDValue();
5748
5749 SDValue CmpInputValue = N->getOperand(1);
5750 SDValue AndInputValue1 = AndNode->getOperand(0);
5751 if (AndInputValue1.getOpcode() == ISD::XOR) {
5752 if (CC != ISD::SETEQ && CC != ISD::SETNE)
5753 return SDValue();
5754 ConstantSDNode *CN = dyn_cast<ConstantSDNode>(AndInputValue1.getOperand(1));
5755 if (!CN || CN->getSExtValue() != -1)
5756 return SDValue();
5757 CN = dyn_cast<ConstantSDNode>(CmpInputValue);
5758 if (!CN || CN->getSExtValue() != 0)
5759 return SDValue();
5760 AndInputValue1 = AndInputValue1.getOperand(0);
5761 if (AndInputValue1.getOpcode() != ISD::ZERO_EXTEND)
5762 return SDValue();
5763 } else if (AndInputValue1.getOpcode() == ISD::ZERO_EXTEND) {
5764 if (AndInputValue2 != CmpInputValue)
5765 return SDValue();
5766 } else {
5767 return SDValue();
5768 }
5769
5770 SDValue TruncValue1 = AndInputValue1.getNode()->getOperand(0);
5771 if (TruncValue1.getOpcode() != ISD::TRUNCATE)
5772 return SDValue();
5773
5774 SDValue TruncValue2 = AndInputValue2.getNode()->getOperand(0);
5775 if (TruncValue2.getOpcode() != ISD::TRUNCATE)
5776 return SDValue();
5777
5778 SDValue TruncInputValue1 = TruncValue1.getNode()->getOperand(0);
5779 SDValue TruncInputValue2 = TruncValue2.getNode()->getOperand(0);
5780 ISD::LoadExtType ExtType1;
5781 ISD::LoadExtType ExtType2;
5782
5783 if (!checkValueWidth(TruncInputValue1, ExtType1) ||
5784 !checkValueWidth(TruncInputValue2, ExtType2))
5785 return SDValue();
5786
5787 if (TruncInputValue1->getValueType(0) != TruncInputValue2->getValueType(0) ||
5788 AndNode->getValueType(0) != TruncInputValue1->getValueType(0))
5789 return SDValue();
5790
5791 if ((ExtType2 != ISD::ZEXTLOAD) &&
5792 ((ExtType2 != ISD::SEXTLOAD) && (ExtType1 != ISD::SEXTLOAD)))
5793 return SDValue();
5794
5795 // These truncation and zero-extension nodes are not necessary, remove them.
5796 SDValue NewAnd = DAG.getNode(ISD::AND, SDLoc(N), AndNode->getValueType(0),
5797 TruncInputValue1, TruncInputValue2);
5798 SDValue NewSetCC =
5799 DAG.getSetCC(SDLoc(N), N->getValueType(0), NewAnd, TruncInputValue2, CC);
5800 DAG.ReplaceAllUsesWith(N, NewSetCC.getNode());
5801 return SDValue(N, 0);
5802}
5803
5804// Combine (loongarch_bitrev_w (loongarch_revb_2w X)) to loongarch_bitrev_4b.
5805static SDValue performBITREV_WCombine(SDNode *N, SelectionDAG &DAG,
5806 TargetLowering::DAGCombinerInfo &DCI,
5807 const LoongArchSubtarget &Subtarget) {
5808 if (DCI.isBeforeLegalizeOps())
5809 return SDValue();
5810
5811 SDValue Src = N->getOperand(0);
5812 if (Src.getOpcode() != LoongArchISD::REVB_2W)
5813 return SDValue();
5814
5815 return DAG.getNode(LoongArchISD::BITREV_4B, SDLoc(N), N->getValueType(0),
5816 Src.getOperand(0));
5817}
5818
5819// Perform common combines for BR_CC and SELECT_CC conditions.
5820static bool combine_CC(SDValue &LHS, SDValue &RHS, SDValue &CC, const SDLoc &DL,
5821 SelectionDAG &DAG, const LoongArchSubtarget &Subtarget) {
5822 ISD::CondCode CCVal = cast<CondCodeSDNode>(CC)->get();
5823
 5824  // Since an arithmetic right shift always preserves the sign bit, the
 5825  // shift can be omitted.
5826 // Fold setlt (sra X, N), 0 -> setlt X, 0 and
5827 // setge (sra X, N), 0 -> setge X, 0
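  // For example, (setlt (sra X, 3), 0) only tests the sign bit, which the
  // arithmetic shift preserves, so it is equivalent to (setlt X, 0).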
5828 if (isNullConstant(RHS) && (CCVal == ISD::SETGE || CCVal == ISD::SETLT) &&
5829 LHS.getOpcode() == ISD::SRA) {
5830 LHS = LHS.getOperand(0);
5831 return true;
5832 }
5833
5834 if (!ISD::isIntEqualitySetCC(CCVal))
5835 return false;
5836
5837 // Fold ((setlt X, Y), 0, ne) -> (X, Y, lt)
5838 // Sometimes the setcc is introduced after br_cc/select_cc has been formed.
5839 if (LHS.getOpcode() == ISD::SETCC && isNullConstant(RHS) &&
5840 LHS.getOperand(0).getValueType() == Subtarget.getGRLenVT()) {
5841 // If we're looking for eq 0 instead of ne 0, we need to invert the
5842 // condition.
5843 bool Invert = CCVal == ISD::SETEQ;
5844 CCVal = cast<CondCodeSDNode>(LHS.getOperand(2))->get();
5845 if (Invert)
5846 CCVal = ISD::getSetCCInverse(CCVal, LHS.getValueType());
5847
5848 RHS = LHS.getOperand(1);
5849 LHS = LHS.getOperand(0);
5850 translateSetCCForBranch(DL, LHS, RHS, CCVal, DAG);
5851
5852 CC = DAG.getCondCode(CCVal);
5853 return true;
5854 }
5855
5856 // Fold ((srl (and X, 1<<C), C), 0, eq/ne) -> ((shl X, GRLen-1-C), 0, ge/lt)
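  // Shifting bit C into the sign position lets the comparison test the sign
  // instead of materializing the mask; e.g. on LA64 with C = 5,
  // ((srl (and X, 0x20), 5), 0, eq) becomes ((shl X, 58), 0, ge).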
5857 if (isNullConstant(RHS) && LHS.getOpcode() == ISD::SRL && LHS.hasOneUse() &&
5858 LHS.getOperand(1).getOpcode() == ISD::Constant) {
5859 SDValue LHS0 = LHS.getOperand(0);
5860 if (LHS0.getOpcode() == ISD::AND &&
5861 LHS0.getOperand(1).getOpcode() == ISD::Constant) {
5862 uint64_t Mask = LHS0.getConstantOperandVal(1);
5863 uint64_t ShAmt = LHS.getConstantOperandVal(1);
5864 if (isPowerOf2_64(Mask) && Log2_64(Mask) == ShAmt) {
5865 CCVal = CCVal == ISD::SETEQ ? ISD::SETGE : ISD::SETLT;
5866 CC = DAG.getCondCode(CCVal);
5867
5868 ShAmt = LHS.getValueSizeInBits() - 1 - ShAmt;
5869 LHS = LHS0.getOperand(0);
5870 if (ShAmt != 0)
5871 LHS =
5872 DAG.getNode(ISD::SHL, DL, LHS.getValueType(), LHS0.getOperand(0),
5873 DAG.getConstant(ShAmt, DL, LHS.getValueType()));
5874 return true;
5875 }
5876 }
5877 }
5878
5879 // (X, 1, setne) -> (X, 0, seteq) if we can prove X is 0/1.
5880 // This can occur when legalizing some floating point comparisons.
5881 APInt Mask = APInt::getBitsSetFrom(LHS.getValueSizeInBits(), 1);
5882 if (isOneConstant(RHS) && DAG.MaskedValueIsZero(LHS, Mask)) {
5883 CCVal = ISD::getSetCCInverse(CCVal, LHS.getValueType());
5884 CC = DAG.getCondCode(CCVal);
5885 RHS = DAG.getConstant(0, DL, LHS.getValueType());
5886 return true;
5887 }
5888
5889 return false;
5890}
5891
5892static SDValue performBR_CCCombine(SDNode *N, SelectionDAG &DAG,
5893 TargetLowering::DAGCombinerInfo &DCI,
5894 const LoongArchSubtarget &Subtarget) {
5895 SDValue LHS = N->getOperand(1);
5896 SDValue RHS = N->getOperand(2);
5897 SDValue CC = N->getOperand(3);
5898 SDLoc DL(N);
5899
5900 if (combine_CC(LHS, RHS, CC, DL, DAG, Subtarget))
5901 return DAG.getNode(LoongArchISD::BR_CC, DL, N->getValueType(0),
5902 N->getOperand(0), LHS, RHS, CC, N->getOperand(4));
5903
5904 return SDValue();
5905}
5906
5907static SDValue performSELECT_CCCombine(SDNode *N, SelectionDAG &DAG,
5908 TargetLowering::DAGCombinerInfo &DCI,
5909 const LoongArchSubtarget &Subtarget) {
5910 // Transform
5911 SDValue LHS = N->getOperand(0);
5912 SDValue RHS = N->getOperand(1);
5913 SDValue CC = N->getOperand(2);
5914 ISD::CondCode CCVal = cast<CondCodeSDNode>(CC)->get();
5915 SDValue TrueV = N->getOperand(3);
5916 SDValue FalseV = N->getOperand(4);
5917 SDLoc DL(N);
5918 EVT VT = N->getValueType(0);
5919
5920 // If the True and False values are the same, we don't need a select_cc.
5921 if (TrueV == FalseV)
5922 return TrueV;
5923
5924 // (select (x < 0), y, z) -> x >> (GRLEN - 1) & (y - z) + z
5925 // (select (x >= 0), y, z) -> x >> (GRLEN - 1) & (z - y) + y
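  // When x < 0, x >> (GRLEN - 1) is all ones, so the AND keeps (y - z) and the
  // ADD yields y; when x >= 0 the shift gives zero and the result is z, so no
  // branch is needed.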
5926 if (isa<ConstantSDNode>(TrueV) && isa<ConstantSDNode>(FalseV) &&
 5927      isNullConstant(RHS) &&
 5928      (CCVal == ISD::CondCode::SETLT || CCVal == ISD::CondCode::SETGE)) {
5929 if (CCVal == ISD::CondCode::SETGE)
5930 std::swap(TrueV, FalseV);
5931
5932 int64_t TrueSImm = cast<ConstantSDNode>(TrueV)->getSExtValue();
5933 int64_t FalseSImm = cast<ConstantSDNode>(FalseV)->getSExtValue();
 5934    // Only handle simm12; constants outside this range are better kept in a
 5935    // register.
5936 if (isInt<12>(TrueSImm) && isInt<12>(FalseSImm) &&
5937 isInt<12>(TrueSImm - FalseSImm)) {
5938 SDValue SRA =
5939 DAG.getNode(ISD::SRA, DL, VT, LHS,
5940 DAG.getConstant(Subtarget.getGRLen() - 1, DL, VT));
5941 SDValue AND =
5942 DAG.getNode(ISD::AND, DL, VT, SRA,
5943 DAG.getSignedConstant(TrueSImm - FalseSImm, DL, VT));
5944 return DAG.getNode(ISD::ADD, DL, VT, AND, FalseV);
5945 }
5946
5947 if (CCVal == ISD::CondCode::SETGE)
5948 std::swap(TrueV, FalseV);
5949 }
5950
5951 if (combine_CC(LHS, RHS, CC, DL, DAG, Subtarget))
5952 return DAG.getNode(LoongArchISD::SELECT_CC, DL, N->getValueType(0),
5953 {LHS, RHS, CC, TrueV, FalseV});
5954
5955 return SDValue();
5956}
5957
5958template <unsigned N>
5959static SDValue legalizeIntrinsicImmArg(SDNode *Node, unsigned ImmOp,
5960 SelectionDAG &DAG,
5961 const LoongArchSubtarget &Subtarget,
5962 bool IsSigned = false) {
5963 SDLoc DL(Node);
5964 auto *CImm = cast<ConstantSDNode>(Node->getOperand(ImmOp));
5965 // Check the ImmArg.
5966 if ((IsSigned && !isInt<N>(CImm->getSExtValue())) ||
5967 (!IsSigned && !isUInt<N>(CImm->getZExtValue()))) {
5968 DAG.getContext()->emitError(Node->getOperationName(0) +
5969 ": argument out of range.");
5970 return DAG.getNode(ISD::UNDEF, DL, Subtarget.getGRLenVT());
5971 }
5972 return DAG.getConstant(CImm->getZExtValue(), DL, Subtarget.getGRLenVT());
5973}
5974
5975template <unsigned N>
5976static SDValue lowerVectorSplatImm(SDNode *Node, unsigned ImmOp,
5977 SelectionDAG &DAG, bool IsSigned = false) {
5978 SDLoc DL(Node);
5979 EVT ResTy = Node->getValueType(0);
5980 auto *CImm = cast<ConstantSDNode>(Node->getOperand(ImmOp));
5981
5982 // Check the ImmArg.
5983 if ((IsSigned && !isInt<N>(CImm->getSExtValue())) ||
5984 (!IsSigned && !isUInt<N>(CImm->getZExtValue()))) {
5985 DAG.getContext()->emitError(Node->getOperationName(0) +
5986 ": argument out of range.");
5987 return DAG.getNode(ISD::UNDEF, DL, ResTy);
5988 }
5989 return DAG.getConstant(
 5990      APInt(ResTy.getScalarType().getSizeInBits(),
 5991            IsSigned ? CImm->getSExtValue() : CImm->getZExtValue(), IsSigned),
5992 DL, ResTy);
5993}
5994
5995static SDValue truncateVecElts(SDNode *Node, SelectionDAG &DAG) {
5996 SDLoc DL(Node);
5997 EVT ResTy = Node->getValueType(0);
5998 SDValue Vec = Node->getOperand(2);
5999 SDValue Mask = DAG.getConstant(Vec.getScalarValueSizeInBits() - 1, DL, ResTy);
6000 return DAG.getNode(ISD::AND, DL, ResTy, Vec, Mask);
6001}
6002
6003static SDValue lowerVectorBitClear(SDNode *Node, SelectionDAG &DAG) {
6004 SDLoc DL(Node);
6005 EVT ResTy = Node->getValueType(0);
6006 SDValue One = DAG.getConstant(1, DL, ResTy);
6007 SDValue Bit =
6008 DAG.getNode(ISD::SHL, DL, ResTy, One, truncateVecElts(Node, DAG));
6009
6010 return DAG.getNode(ISD::AND, DL, ResTy, Node->getOperand(1),
6011 DAG.getNOT(DL, Bit, ResTy));
6012}
6013
6014template <unsigned N>
6015static SDValue lowerVectorBitClearImm(SDNode *Node, SelectionDAG &DAG) {
6016 SDLoc DL(Node);
6017 EVT ResTy = Node->getValueType(0);
6018 auto *CImm = cast<ConstantSDNode>(Node->getOperand(2));
6019 // Check the unsigned ImmArg.
6020 if (!isUInt<N>(CImm->getZExtValue())) {
6021 DAG.getContext()->emitError(Node->getOperationName(0) +
6022 ": argument out of range.");
6023 return DAG.getNode(ISD::UNDEF, DL, ResTy);
6024 }
6025
6026 APInt BitImm = APInt(ResTy.getScalarSizeInBits(), 1) << CImm->getAPIntValue();
6027 SDValue Mask = DAG.getConstant(~BitImm, DL, ResTy);
6028
6029 return DAG.getNode(ISD::AND, DL, ResTy, Node->getOperand(1), Mask);
6030}
6031
6032template <unsigned N>
6033static SDValue lowerVectorBitSetImm(SDNode *Node, SelectionDAG &DAG) {
6034 SDLoc DL(Node);
6035 EVT ResTy = Node->getValueType(0);
6036 auto *CImm = cast<ConstantSDNode>(Node->getOperand(2));
6037 // Check the unsigned ImmArg.
6038 if (!isUInt<N>(CImm->getZExtValue())) {
6039 DAG.getContext()->emitError(Node->getOperationName(0) +
6040 ": argument out of range.");
6041 return DAG.getNode(ISD::UNDEF, DL, ResTy);
6042 }
6043
6044 APInt Imm = APInt(ResTy.getScalarSizeInBits(), 1) << CImm->getAPIntValue();
6045 SDValue BitImm = DAG.getConstant(Imm, DL, ResTy);
6046 return DAG.getNode(ISD::OR, DL, ResTy, Node->getOperand(1), BitImm);
6047}
6048
6049template <unsigned N>
6050static SDValue lowerVectorBitRevImm(SDNode *Node, SelectionDAG &DAG) {
6051 SDLoc DL(Node);
6052 EVT ResTy = Node->getValueType(0);
6053 auto *CImm = cast<ConstantSDNode>(Node->getOperand(2));
6054 // Check the unsigned ImmArg.
6055 if (!isUInt<N>(CImm->getZExtValue())) {
6056 DAG.getContext()->emitError(Node->getOperationName(0) +
6057 ": argument out of range.");
6058 return DAG.getNode(ISD::UNDEF, DL, ResTy);
6059 }
6060
6061 APInt Imm = APInt(ResTy.getScalarSizeInBits(), 1) << CImm->getAPIntValue();
6062 SDValue BitImm = DAG.getConstant(Imm, DL, ResTy);
6063 return DAG.getNode(ISD::XOR, DL, ResTy, Node->getOperand(1), BitImm);
6064}
6065
6066template <unsigned W>
6068 unsigned ResOp) {
6069 unsigned Imm = N->getConstantOperandVal(2);
6070 if (!isUInt<W>(Imm)) {
6071 const StringRef ErrorMsg = "argument out of range";
6072 DAG.getContext()->emitError(N->getOperationName(0) + ": " + ErrorMsg + ".");
6073 return DAG.getUNDEF(N->getValueType(0));
6074 }
6075 SDLoc DL(N);
6076 SDValue Vec = N->getOperand(1);
6077 SDValue Idx = DAG.getConstant(Imm, DL, MVT::i32);
6079 return DAG.getNode(ResOp, DL, N->getValueType(0), Vec, Idx, EltVT);
6080}
6081
6082static SDValue
6083performINTRINSIC_WO_CHAINCombine(SDNode *N, SelectionDAG &DAG,
6084 TargetLowering::DAGCombinerInfo &DCI,
6085 const LoongArchSubtarget &Subtarget) {
6086 SDLoc DL(N);
6087 switch (N->getConstantOperandVal(0)) {
6088 default:
6089 break;
6090 case Intrinsic::loongarch_lsx_vadd_b:
6091 case Intrinsic::loongarch_lsx_vadd_h:
6092 case Intrinsic::loongarch_lsx_vadd_w:
6093 case Intrinsic::loongarch_lsx_vadd_d:
6094 case Intrinsic::loongarch_lasx_xvadd_b:
6095 case Intrinsic::loongarch_lasx_xvadd_h:
6096 case Intrinsic::loongarch_lasx_xvadd_w:
6097 case Intrinsic::loongarch_lasx_xvadd_d:
6098 return DAG.getNode(ISD::ADD, DL, N->getValueType(0), N->getOperand(1),
6099 N->getOperand(2));
6100 case Intrinsic::loongarch_lsx_vaddi_bu:
6101 case Intrinsic::loongarch_lsx_vaddi_hu:
6102 case Intrinsic::loongarch_lsx_vaddi_wu:
6103 case Intrinsic::loongarch_lsx_vaddi_du:
6104 case Intrinsic::loongarch_lasx_xvaddi_bu:
6105 case Intrinsic::loongarch_lasx_xvaddi_hu:
6106 case Intrinsic::loongarch_lasx_xvaddi_wu:
6107 case Intrinsic::loongarch_lasx_xvaddi_du:
6108 return DAG.getNode(ISD::ADD, DL, N->getValueType(0), N->getOperand(1),
6109 lowerVectorSplatImm<5>(N, 2, DAG));
6110 case Intrinsic::loongarch_lsx_vsub_b:
6111 case Intrinsic::loongarch_lsx_vsub_h:
6112 case Intrinsic::loongarch_lsx_vsub_w:
6113 case Intrinsic::loongarch_lsx_vsub_d:
6114 case Intrinsic::loongarch_lasx_xvsub_b:
6115 case Intrinsic::loongarch_lasx_xvsub_h:
6116 case Intrinsic::loongarch_lasx_xvsub_w:
6117 case Intrinsic::loongarch_lasx_xvsub_d:
6118 return DAG.getNode(ISD::SUB, DL, N->getValueType(0), N->getOperand(1),
6119 N->getOperand(2));
6120 case Intrinsic::loongarch_lsx_vsubi_bu:
6121 case Intrinsic::loongarch_lsx_vsubi_hu:
6122 case Intrinsic::loongarch_lsx_vsubi_wu:
6123 case Intrinsic::loongarch_lsx_vsubi_du:
6124 case Intrinsic::loongarch_lasx_xvsubi_bu:
6125 case Intrinsic::loongarch_lasx_xvsubi_hu:
6126 case Intrinsic::loongarch_lasx_xvsubi_wu:
6127 case Intrinsic::loongarch_lasx_xvsubi_du:
6128 return DAG.getNode(ISD::SUB, DL, N->getValueType(0), N->getOperand(1),
6129 lowerVectorSplatImm<5>(N, 2, DAG));
6130 case Intrinsic::loongarch_lsx_vneg_b:
6131 case Intrinsic::loongarch_lsx_vneg_h:
6132 case Intrinsic::loongarch_lsx_vneg_w:
6133 case Intrinsic::loongarch_lsx_vneg_d:
6134 case Intrinsic::loongarch_lasx_xvneg_b:
6135 case Intrinsic::loongarch_lasx_xvneg_h:
6136 case Intrinsic::loongarch_lasx_xvneg_w:
6137 case Intrinsic::loongarch_lasx_xvneg_d:
6138 return DAG.getNode(
6139 ISD::SUB, DL, N->getValueType(0),
6140 DAG.getConstant(
6141 APInt(N->getValueType(0).getScalarType().getSizeInBits(), 0,
6142 /*isSigned=*/true),
6143 SDLoc(N), N->getValueType(0)),
6144 N->getOperand(1));
6145 case Intrinsic::loongarch_lsx_vmax_b:
6146 case Intrinsic::loongarch_lsx_vmax_h:
6147 case Intrinsic::loongarch_lsx_vmax_w:
6148 case Intrinsic::loongarch_lsx_vmax_d:
6149 case Intrinsic::loongarch_lasx_xvmax_b:
6150 case Intrinsic::loongarch_lasx_xvmax_h:
6151 case Intrinsic::loongarch_lasx_xvmax_w:
6152 case Intrinsic::loongarch_lasx_xvmax_d:
6153 return DAG.getNode(ISD::SMAX, DL, N->getValueType(0), N->getOperand(1),
6154 N->getOperand(2));
6155 case Intrinsic::loongarch_lsx_vmax_bu:
6156 case Intrinsic::loongarch_lsx_vmax_hu:
6157 case Intrinsic::loongarch_lsx_vmax_wu:
6158 case Intrinsic::loongarch_lsx_vmax_du:
6159 case Intrinsic::loongarch_lasx_xvmax_bu:
6160 case Intrinsic::loongarch_lasx_xvmax_hu:
6161 case Intrinsic::loongarch_lasx_xvmax_wu:
6162 case Intrinsic::loongarch_lasx_xvmax_du:
6163 return DAG.getNode(ISD::UMAX, DL, N->getValueType(0), N->getOperand(1),
6164 N->getOperand(2));
6165 case Intrinsic::loongarch_lsx_vmaxi_b:
6166 case Intrinsic::loongarch_lsx_vmaxi_h:
6167 case Intrinsic::loongarch_lsx_vmaxi_w:
6168 case Intrinsic::loongarch_lsx_vmaxi_d:
6169 case Intrinsic::loongarch_lasx_xvmaxi_b:
6170 case Intrinsic::loongarch_lasx_xvmaxi_h:
6171 case Intrinsic::loongarch_lasx_xvmaxi_w:
6172 case Intrinsic::loongarch_lasx_xvmaxi_d:
6173 return DAG.getNode(ISD::SMAX, DL, N->getValueType(0), N->getOperand(1),
6174 lowerVectorSplatImm<5>(N, 2, DAG, /*IsSigned=*/true));
6175 case Intrinsic::loongarch_lsx_vmaxi_bu:
6176 case Intrinsic::loongarch_lsx_vmaxi_hu:
6177 case Intrinsic::loongarch_lsx_vmaxi_wu:
6178 case Intrinsic::loongarch_lsx_vmaxi_du:
6179 case Intrinsic::loongarch_lasx_xvmaxi_bu:
6180 case Intrinsic::loongarch_lasx_xvmaxi_hu:
6181 case Intrinsic::loongarch_lasx_xvmaxi_wu:
6182 case Intrinsic::loongarch_lasx_xvmaxi_du:
6183 return DAG.getNode(ISD::UMAX, DL, N->getValueType(0), N->getOperand(1),
6184 lowerVectorSplatImm<5>(N, 2, DAG));
6185 case Intrinsic::loongarch_lsx_vmin_b:
6186 case Intrinsic::loongarch_lsx_vmin_h:
6187 case Intrinsic::loongarch_lsx_vmin_w:
6188 case Intrinsic::loongarch_lsx_vmin_d:
6189 case Intrinsic::loongarch_lasx_xvmin_b:
6190 case Intrinsic::loongarch_lasx_xvmin_h:
6191 case Intrinsic::loongarch_lasx_xvmin_w:
6192 case Intrinsic::loongarch_lasx_xvmin_d:
6193 return DAG.getNode(ISD::SMIN, DL, N->getValueType(0), N->getOperand(1),
6194 N->getOperand(2));
6195 case Intrinsic::loongarch_lsx_vmin_bu:
6196 case Intrinsic::loongarch_lsx_vmin_hu:
6197 case Intrinsic::loongarch_lsx_vmin_wu:
6198 case Intrinsic::loongarch_lsx_vmin_du:
6199 case Intrinsic::loongarch_lasx_xvmin_bu:
6200 case Intrinsic::loongarch_lasx_xvmin_hu:
6201 case Intrinsic::loongarch_lasx_xvmin_wu:
6202 case Intrinsic::loongarch_lasx_xvmin_du:
6203 return DAG.getNode(ISD::UMIN, DL, N->getValueType(0), N->getOperand(1),
6204 N->getOperand(2));
6205 case Intrinsic::loongarch_lsx_vmini_b:
6206 case Intrinsic::loongarch_lsx_vmini_h:
6207 case Intrinsic::loongarch_lsx_vmini_w:
6208 case Intrinsic::loongarch_lsx_vmini_d:
6209 case Intrinsic::loongarch_lasx_xvmini_b:
6210 case Intrinsic::loongarch_lasx_xvmini_h:
6211 case Intrinsic::loongarch_lasx_xvmini_w:
6212 case Intrinsic::loongarch_lasx_xvmini_d:
6213 return DAG.getNode(ISD::SMIN, DL, N->getValueType(0), N->getOperand(1),
6214 lowerVectorSplatImm<5>(N, 2, DAG, /*IsSigned=*/true));
6215 case Intrinsic::loongarch_lsx_vmini_bu:
6216 case Intrinsic::loongarch_lsx_vmini_hu:
6217 case Intrinsic::loongarch_lsx_vmini_wu:
6218 case Intrinsic::loongarch_lsx_vmini_du:
6219 case Intrinsic::loongarch_lasx_xvmini_bu:
6220 case Intrinsic::loongarch_lasx_xvmini_hu:
6221 case Intrinsic::loongarch_lasx_xvmini_wu:
6222 case Intrinsic::loongarch_lasx_xvmini_du:
6223 return DAG.getNode(ISD::UMIN, DL, N->getValueType(0), N->getOperand(1),
6224 lowerVectorSplatImm<5>(N, 2, DAG));
6225 case Intrinsic::loongarch_lsx_vmul_b:
6226 case Intrinsic::loongarch_lsx_vmul_h:
6227 case Intrinsic::loongarch_lsx_vmul_w:
6228 case Intrinsic::loongarch_lsx_vmul_d:
6229 case Intrinsic::loongarch_lasx_xvmul_b:
6230 case Intrinsic::loongarch_lasx_xvmul_h:
6231 case Intrinsic::loongarch_lasx_xvmul_w:
6232 case Intrinsic::loongarch_lasx_xvmul_d:
6233 return DAG.getNode(ISD::MUL, DL, N->getValueType(0), N->getOperand(1),
6234 N->getOperand(2));
6235 case Intrinsic::loongarch_lsx_vmadd_b:
6236 case Intrinsic::loongarch_lsx_vmadd_h:
6237 case Intrinsic::loongarch_lsx_vmadd_w:
6238 case Intrinsic::loongarch_lsx_vmadd_d:
6239 case Intrinsic::loongarch_lasx_xvmadd_b:
6240 case Intrinsic::loongarch_lasx_xvmadd_h:
6241 case Intrinsic::loongarch_lasx_xvmadd_w:
6242 case Intrinsic::loongarch_lasx_xvmadd_d: {
6243 EVT ResTy = N->getValueType(0);
6244 return DAG.getNode(ISD::ADD, SDLoc(N), ResTy, N->getOperand(1),
6245 DAG.getNode(ISD::MUL, SDLoc(N), ResTy, N->getOperand(2),
6246 N->getOperand(3)));
6247 }
6248 case Intrinsic::loongarch_lsx_vmsub_b:
6249 case Intrinsic::loongarch_lsx_vmsub_h:
6250 case Intrinsic::loongarch_lsx_vmsub_w:
6251 case Intrinsic::loongarch_lsx_vmsub_d:
6252 case Intrinsic::loongarch_lasx_xvmsub_b:
6253 case Intrinsic::loongarch_lasx_xvmsub_h:
6254 case Intrinsic::loongarch_lasx_xvmsub_w:
6255 case Intrinsic::loongarch_lasx_xvmsub_d: {
6256 EVT ResTy = N->getValueType(0);
6257 return DAG.getNode(ISD::SUB, SDLoc(N), ResTy, N->getOperand(1),
6258 DAG.getNode(ISD::MUL, SDLoc(N), ResTy, N->getOperand(2),
6259 N->getOperand(3)));
6260 }
6261 case Intrinsic::loongarch_lsx_vdiv_b:
6262 case Intrinsic::loongarch_lsx_vdiv_h:
6263 case Intrinsic::loongarch_lsx_vdiv_w:
6264 case Intrinsic::loongarch_lsx_vdiv_d:
6265 case Intrinsic::loongarch_lasx_xvdiv_b:
6266 case Intrinsic::loongarch_lasx_xvdiv_h:
6267 case Intrinsic::loongarch_lasx_xvdiv_w:
6268 case Intrinsic::loongarch_lasx_xvdiv_d:
6269 return DAG.getNode(ISD::SDIV, DL, N->getValueType(0), N->getOperand(1),
6270 N->getOperand(2));
6271 case Intrinsic::loongarch_lsx_vdiv_bu:
6272 case Intrinsic::loongarch_lsx_vdiv_hu:
6273 case Intrinsic::loongarch_lsx_vdiv_wu:
6274 case Intrinsic::loongarch_lsx_vdiv_du:
6275 case Intrinsic::loongarch_lasx_xvdiv_bu:
6276 case Intrinsic::loongarch_lasx_xvdiv_hu:
6277 case Intrinsic::loongarch_lasx_xvdiv_wu:
6278 case Intrinsic::loongarch_lasx_xvdiv_du:
6279 return DAG.getNode(ISD::UDIV, DL, N->getValueType(0), N->getOperand(1),
6280 N->getOperand(2));
6281 case Intrinsic::loongarch_lsx_vmod_b:
6282 case Intrinsic::loongarch_lsx_vmod_h:
6283 case Intrinsic::loongarch_lsx_vmod_w:
6284 case Intrinsic::loongarch_lsx_vmod_d:
6285 case Intrinsic::loongarch_lasx_xvmod_b:
6286 case Intrinsic::loongarch_lasx_xvmod_h:
6287 case Intrinsic::loongarch_lasx_xvmod_w:
6288 case Intrinsic::loongarch_lasx_xvmod_d:
6289 return DAG.getNode(ISD::SREM, DL, N->getValueType(0), N->getOperand(1),
6290 N->getOperand(2));
6291 case Intrinsic::loongarch_lsx_vmod_bu:
6292 case Intrinsic::loongarch_lsx_vmod_hu:
6293 case Intrinsic::loongarch_lsx_vmod_wu:
6294 case Intrinsic::loongarch_lsx_vmod_du:
6295 case Intrinsic::loongarch_lasx_xvmod_bu:
6296 case Intrinsic::loongarch_lasx_xvmod_hu:
6297 case Intrinsic::loongarch_lasx_xvmod_wu:
6298 case Intrinsic::loongarch_lasx_xvmod_du:
6299 return DAG.getNode(ISD::UREM, DL, N->getValueType(0), N->getOperand(1),
6300 N->getOperand(2));
6301 case Intrinsic::loongarch_lsx_vand_v:
6302 case Intrinsic::loongarch_lasx_xvand_v:
6303 return DAG.getNode(ISD::AND, DL, N->getValueType(0), N->getOperand(1),
6304 N->getOperand(2));
6305 case Intrinsic::loongarch_lsx_vor_v:
6306 case Intrinsic::loongarch_lasx_xvor_v:
6307 return DAG.getNode(ISD::OR, DL, N->getValueType(0), N->getOperand(1),
6308 N->getOperand(2));
6309 case Intrinsic::loongarch_lsx_vxor_v:
6310 case Intrinsic::loongarch_lasx_xvxor_v:
6311 return DAG.getNode(ISD::XOR, DL, N->getValueType(0), N->getOperand(1),
6312 N->getOperand(2));
6313 case Intrinsic::loongarch_lsx_vnor_v:
6314 case Intrinsic::loongarch_lasx_xvnor_v: {
6315 SDValue Res = DAG.getNode(ISD::OR, DL, N->getValueType(0), N->getOperand(1),
6316 N->getOperand(2));
6317 return DAG.getNOT(DL, Res, Res->getValueType(0));
6318 }
6319 case Intrinsic::loongarch_lsx_vandi_b:
6320 case Intrinsic::loongarch_lasx_xvandi_b:
6321 return DAG.getNode(ISD::AND, DL, N->getValueType(0), N->getOperand(1),
6322 lowerVectorSplatImm<8>(N, 2, DAG));
6323 case Intrinsic::loongarch_lsx_vori_b:
6324 case Intrinsic::loongarch_lasx_xvori_b:
6325 return DAG.getNode(ISD::OR, DL, N->getValueType(0), N->getOperand(1),
6326 lowerVectorSplatImm<8>(N, 2, DAG));
6327 case Intrinsic::loongarch_lsx_vxori_b:
6328 case Intrinsic::loongarch_lasx_xvxori_b:
6329 return DAG.getNode(ISD::XOR, DL, N->getValueType(0), N->getOperand(1),
6330 lowerVectorSplatImm<8>(N, 2, DAG));
6331 case Intrinsic::loongarch_lsx_vsll_b:
6332 case Intrinsic::loongarch_lsx_vsll_h:
6333 case Intrinsic::loongarch_lsx_vsll_w:
6334 case Intrinsic::loongarch_lsx_vsll_d:
6335 case Intrinsic::loongarch_lasx_xvsll_b:
6336 case Intrinsic::loongarch_lasx_xvsll_h:
6337 case Intrinsic::loongarch_lasx_xvsll_w:
6338 case Intrinsic::loongarch_lasx_xvsll_d:
6339 return DAG.getNode(ISD::SHL, DL, N->getValueType(0), N->getOperand(1),
6340 truncateVecElts(N, DAG));
6341 case Intrinsic::loongarch_lsx_vslli_b:
6342 case Intrinsic::loongarch_lasx_xvslli_b:
6343 return DAG.getNode(ISD::SHL, DL, N->getValueType(0), N->getOperand(1),
6344 lowerVectorSplatImm<3>(N, 2, DAG));
6345 case Intrinsic::loongarch_lsx_vslli_h:
6346 case Intrinsic::loongarch_lasx_xvslli_h:
6347 return DAG.getNode(ISD::SHL, DL, N->getValueType(0), N->getOperand(1),
6348 lowerVectorSplatImm<4>(N, 2, DAG));
6349 case Intrinsic::loongarch_lsx_vslli_w:
6350 case Intrinsic::loongarch_lasx_xvslli_w:
6351 return DAG.getNode(ISD::SHL, DL, N->getValueType(0), N->getOperand(1),
6352 lowerVectorSplatImm<5>(N, 2, DAG));
6353 case Intrinsic::loongarch_lsx_vslli_d:
6354 case Intrinsic::loongarch_lasx_xvslli_d:
6355 return DAG.getNode(ISD::SHL, DL, N->getValueType(0), N->getOperand(1),
6356 lowerVectorSplatImm<6>(N, 2, DAG));
6357 case Intrinsic::loongarch_lsx_vsrl_b:
6358 case Intrinsic::loongarch_lsx_vsrl_h:
6359 case Intrinsic::loongarch_lsx_vsrl_w:
6360 case Intrinsic::loongarch_lsx_vsrl_d:
6361 case Intrinsic::loongarch_lasx_xvsrl_b:
6362 case Intrinsic::loongarch_lasx_xvsrl_h:
6363 case Intrinsic::loongarch_lasx_xvsrl_w:
6364 case Intrinsic::loongarch_lasx_xvsrl_d:
6365 return DAG.getNode(ISD::SRL, DL, N->getValueType(0), N->getOperand(1),
6366 truncateVecElts(N, DAG));
6367 case Intrinsic::loongarch_lsx_vsrli_b:
6368 case Intrinsic::loongarch_lasx_xvsrli_b:
6369 return DAG.getNode(ISD::SRL, DL, N->getValueType(0), N->getOperand(1),
6370 lowerVectorSplatImm<3>(N, 2, DAG));
6371 case Intrinsic::loongarch_lsx_vsrli_h:
6372 case Intrinsic::loongarch_lasx_xvsrli_h:
6373 return DAG.getNode(ISD::SRL, DL, N->getValueType(0), N->getOperand(1),
6374 lowerVectorSplatImm<4>(N, 2, DAG));
6375 case Intrinsic::loongarch_lsx_vsrli_w:
6376 case Intrinsic::loongarch_lasx_xvsrli_w:
6377 return DAG.getNode(ISD::SRL, DL, N->getValueType(0), N->getOperand(1),
6378 lowerVectorSplatImm<5>(N, 2, DAG));
6379 case Intrinsic::loongarch_lsx_vsrli_d:
6380 case Intrinsic::loongarch_lasx_xvsrli_d:
6381 return DAG.getNode(ISD::SRL, DL, N->getValueType(0), N->getOperand(1),
6382 lowerVectorSplatImm<6>(N, 2, DAG));
6383 case Intrinsic::loongarch_lsx_vsra_b:
6384 case Intrinsic::loongarch_lsx_vsra_h:
6385 case Intrinsic::loongarch_lsx_vsra_w:
6386 case Intrinsic::loongarch_lsx_vsra_d:
6387 case Intrinsic::loongarch_lasx_xvsra_b:
6388 case Intrinsic::loongarch_lasx_xvsra_h:
6389 case Intrinsic::loongarch_lasx_xvsra_w:
6390 case Intrinsic::loongarch_lasx_xvsra_d:
6391 return DAG.getNode(ISD::SRA, DL, N->getValueType(0), N->getOperand(1),
6392 truncateVecElts(N, DAG));
6393 case Intrinsic::loongarch_lsx_vsrai_b:
6394 case Intrinsic::loongarch_lasx_xvsrai_b:
6395 return DAG.getNode(ISD::SRA, DL, N->getValueType(0), N->getOperand(1),
6396 lowerVectorSplatImm<3>(N, 2, DAG));
6397 case Intrinsic::loongarch_lsx_vsrai_h:
6398 case Intrinsic::loongarch_lasx_xvsrai_h:
6399 return DAG.getNode(ISD::SRA, DL, N->getValueType(0), N->getOperand(1),
6400 lowerVectorSplatImm<4>(N, 2, DAG));
6401 case Intrinsic::loongarch_lsx_vsrai_w:
6402 case Intrinsic::loongarch_lasx_xvsrai_w:
6403 return DAG.getNode(ISD::SRA, DL, N->getValueType(0), N->getOperand(1),
6404 lowerVectorSplatImm<5>(N, 2, DAG));
6405 case Intrinsic::loongarch_lsx_vsrai_d:
6406 case Intrinsic::loongarch_lasx_xvsrai_d:
6407 return DAG.getNode(ISD::SRA, DL, N->getValueType(0), N->getOperand(1),
6408 lowerVectorSplatImm<6>(N, 2, DAG));
6409 case Intrinsic::loongarch_lsx_vclz_b:
6410 case Intrinsic::loongarch_lsx_vclz_h:
6411 case Intrinsic::loongarch_lsx_vclz_w:
6412 case Intrinsic::loongarch_lsx_vclz_d:
6413 case Intrinsic::loongarch_lasx_xvclz_b:
6414 case Intrinsic::loongarch_lasx_xvclz_h:
6415 case Intrinsic::loongarch_lasx_xvclz_w:
6416 case Intrinsic::loongarch_lasx_xvclz_d:
6417 return DAG.getNode(ISD::CTLZ, DL, N->getValueType(0), N->getOperand(1));
6418 case Intrinsic::loongarch_lsx_vpcnt_b:
6419 case Intrinsic::loongarch_lsx_vpcnt_h:
6420 case Intrinsic::loongarch_lsx_vpcnt_w:
6421 case Intrinsic::loongarch_lsx_vpcnt_d:
6422 case Intrinsic::loongarch_lasx_xvpcnt_b:
6423 case Intrinsic::loongarch_lasx_xvpcnt_h:
6424 case Intrinsic::loongarch_lasx_xvpcnt_w:
6425 case Intrinsic::loongarch_lasx_xvpcnt_d:
6426 return DAG.getNode(ISD::CTPOP, DL, N->getValueType(0), N->getOperand(1));
6427 case Intrinsic::loongarch_lsx_vbitclr_b:
6428 case Intrinsic::loongarch_lsx_vbitclr_h:
6429 case Intrinsic::loongarch_lsx_vbitclr_w:
6430 case Intrinsic::loongarch_lsx_vbitclr_d:
6431 case Intrinsic::loongarch_lasx_xvbitclr_b:
6432 case Intrinsic::loongarch_lasx_xvbitclr_h:
6433 case Intrinsic::loongarch_lasx_xvbitclr_w:
6434 case Intrinsic::loongarch_lasx_xvbitclr_d:
6435 return lowerVectorBitClear(N, DAG);
6436 case Intrinsic::loongarch_lsx_vbitclri_b:
6437 case Intrinsic::loongarch_lasx_xvbitclri_b:
6438 return lowerVectorBitClearImm<3>(N, DAG);
6439 case Intrinsic::loongarch_lsx_vbitclri_h:
6440 case Intrinsic::loongarch_lasx_xvbitclri_h:
6441 return lowerVectorBitClearImm<4>(N, DAG);
6442 case Intrinsic::loongarch_lsx_vbitclri_w:
6443 case Intrinsic::loongarch_lasx_xvbitclri_w:
6444 return lowerVectorBitClearImm<5>(N, DAG);
6445 case Intrinsic::loongarch_lsx_vbitclri_d:
6446 case Intrinsic::loongarch_lasx_xvbitclri_d:
6447 return lowerVectorBitClearImm<6>(N, DAG);
6448 case Intrinsic::loongarch_lsx_vbitset_b:
6449 case Intrinsic::loongarch_lsx_vbitset_h:
6450 case Intrinsic::loongarch_lsx_vbitset_w:
6451 case Intrinsic::loongarch_lsx_vbitset_d:
6452 case Intrinsic::loongarch_lasx_xvbitset_b:
6453 case Intrinsic::loongarch_lasx_xvbitset_h:
6454 case Intrinsic::loongarch_lasx_xvbitset_w:
6455 case Intrinsic::loongarch_lasx_xvbitset_d: {
6456 EVT VecTy = N->getValueType(0);
6457 SDValue One = DAG.getConstant(1, DL, VecTy);
6458 return DAG.getNode(
6459 ISD::OR, DL, VecTy, N->getOperand(1),
6460 DAG.getNode(ISD::SHL, DL, VecTy, One, truncateVecElts(N, DAG)));
6461 }
6462 case Intrinsic::loongarch_lsx_vbitseti_b:
6463 case Intrinsic::loongarch_lasx_xvbitseti_b:
6464 return lowerVectorBitSetImm<3>(N, DAG);
6465 case Intrinsic::loongarch_lsx_vbitseti_h:
6466 case Intrinsic::loongarch_lasx_xvbitseti_h:
6467 return lowerVectorBitSetImm<4>(N, DAG);
6468 case Intrinsic::loongarch_lsx_vbitseti_w:
6469 case Intrinsic::loongarch_lasx_xvbitseti_w:
6470 return lowerVectorBitSetImm<5>(N, DAG);
6471 case Intrinsic::loongarch_lsx_vbitseti_d:
6472 case Intrinsic::loongarch_lasx_xvbitseti_d:
6473 return lowerVectorBitSetImm<6>(N, DAG);
6474 case Intrinsic::loongarch_lsx_vbitrev_b:
6475 case Intrinsic::loongarch_lsx_vbitrev_h:
6476 case Intrinsic::loongarch_lsx_vbitrev_w:
6477 case Intrinsic::loongarch_lsx_vbitrev_d:
6478 case Intrinsic::loongarch_lasx_xvbitrev_b:
6479 case Intrinsic::loongarch_lasx_xvbitrev_h:
6480 case Intrinsic::loongarch_lasx_xvbitrev_w:
6481 case Intrinsic::loongarch_lasx_xvbitrev_d: {
6482 EVT VecTy = N->getValueType(0);
6483 SDValue One = DAG.getConstant(1, DL, VecTy);
6484 return DAG.getNode(
6485 ISD::XOR, DL, VecTy, N->getOperand(1),
6486 DAG.getNode(ISD::SHL, DL, VecTy, One, truncateVecElts(N, DAG)));
6487 }
6488 case Intrinsic::loongarch_lsx_vbitrevi_b:
6489 case Intrinsic::loongarch_lasx_xvbitrevi_b:
6490 return lowerVectorBitRevImm<3>(N, DAG);
6491 case Intrinsic::loongarch_lsx_vbitrevi_h:
6492 case Intrinsic::loongarch_lasx_xvbitrevi_h:
6493 return lowerVectorBitRevImm<4>(N, DAG);
6494 case Intrinsic::loongarch_lsx_vbitrevi_w:
6495 case Intrinsic::loongarch_lasx_xvbitrevi_w:
6496 return lowerVectorBitRevImm<5>(N, DAG);
6497 case Intrinsic::loongarch_lsx_vbitrevi_d:
6498 case Intrinsic::loongarch_lasx_xvbitrevi_d:
6499 return lowerVectorBitRevImm<6>(N, DAG);
6500 case Intrinsic::loongarch_lsx_vfadd_s:
6501 case Intrinsic::loongarch_lsx_vfadd_d:
6502 case Intrinsic::loongarch_lasx_xvfadd_s:
6503 case Intrinsic::loongarch_lasx_xvfadd_d:
6504 return DAG.getNode(ISD::FADD, DL, N->getValueType(0), N->getOperand(1),
6505 N->getOperand(2));
6506 case Intrinsic::loongarch_lsx_vfsub_s:
6507 case Intrinsic::loongarch_lsx_vfsub_d:
6508 case Intrinsic::loongarch_lasx_xvfsub_s:
6509 case Intrinsic::loongarch_lasx_xvfsub_d:
6510 return DAG.getNode(ISD::FSUB, DL, N->getValueType(0), N->getOperand(1),
6511 N->getOperand(2));
6512 case Intrinsic::loongarch_lsx_vfmul_s:
6513 case Intrinsic::loongarch_lsx_vfmul_d:
6514 case Intrinsic::loongarch_lasx_xvfmul_s:
6515 case Intrinsic::loongarch_lasx_xvfmul_d:
6516 return DAG.getNode(ISD::FMUL, DL, N->getValueType(0), N->getOperand(1),
6517 N->getOperand(2));
6518 case Intrinsic::loongarch_lsx_vfdiv_s:
6519 case Intrinsic::loongarch_lsx_vfdiv_d:
6520 case Intrinsic::loongarch_lasx_xvfdiv_s:
6521 case Intrinsic::loongarch_lasx_xvfdiv_d:
6522 return DAG.getNode(ISD::FDIV, DL, N->getValueType(0), N->getOperand(1),
6523 N->getOperand(2));
6524 case Intrinsic::loongarch_lsx_vfmadd_s:
6525 case Intrinsic::loongarch_lsx_vfmadd_d:
6526 case Intrinsic::loongarch_lasx_xvfmadd_s:
6527 case Intrinsic::loongarch_lasx_xvfmadd_d:
6528 return DAG.getNode(ISD::FMA, DL, N->getValueType(0), N->getOperand(1),
6529 N->getOperand(2), N->getOperand(3));
6530 case Intrinsic::loongarch_lsx_vinsgr2vr_b:
6531 return DAG.getNode(ISD::INSERT_VECTOR_ELT, SDLoc(N), N->getValueType(0),
6532 N->getOperand(1), N->getOperand(2),
6533 legalizeIntrinsicImmArg<4>(N, 3, DAG, Subtarget));
6534 case Intrinsic::loongarch_lsx_vinsgr2vr_h:
6535 case Intrinsic::loongarch_lasx_xvinsgr2vr_w:
6536 return DAG.getNode(ISD::INSERT_VECTOR_ELT, SDLoc(N), N->getValueType(0),
6537 N->getOperand(1), N->getOperand(2),
6538 legalizeIntrinsicImmArg<3>(N, 3, DAG, Subtarget));
6539 case Intrinsic::loongarch_lsx_vinsgr2vr_w:
6540 case Intrinsic::loongarch_lasx_xvinsgr2vr_d:
6541 return DAG.getNode(ISD::INSERT_VECTOR_ELT, SDLoc(N), N->getValueType(0),
6542 N->getOperand(1), N->getOperand(2),
6543 legalizeIntrinsicImmArg<2>(N, 3, DAG, Subtarget));
6544 case Intrinsic::loongarch_lsx_vinsgr2vr_d:
6545 return DAG.getNode(ISD::INSERT_VECTOR_ELT, SDLoc(N), N->getValueType(0),
6546 N->getOperand(1), N->getOperand(2),
6547 legalizeIntrinsicImmArg<1>(N, 3, DAG, Subtarget));
6548 case Intrinsic::loongarch_lsx_vreplgr2vr_b:
6549 case Intrinsic::loongarch_lsx_vreplgr2vr_h:
6550 case Intrinsic::loongarch_lsx_vreplgr2vr_w:
6551 case Intrinsic::loongarch_lsx_vreplgr2vr_d:
6552 case Intrinsic::loongarch_lasx_xvreplgr2vr_b:
6553 case Intrinsic::loongarch_lasx_xvreplgr2vr_h:
6554 case Intrinsic::loongarch_lasx_xvreplgr2vr_w:
6555 case Intrinsic::loongarch_lasx_xvreplgr2vr_d:
6556 return DAG.getNode(LoongArchISD::VREPLGR2VR, DL, N->getValueType(0),
6557 DAG.getNode(ISD::ANY_EXTEND, DL, Subtarget.getGRLenVT(),
6558 N->getOperand(1)));
6559 case Intrinsic::loongarch_lsx_vreplve_b:
6560 case Intrinsic::loongarch_lsx_vreplve_h:
6561 case Intrinsic::loongarch_lsx_vreplve_w:
6562 case Intrinsic::loongarch_lsx_vreplve_d:
6563 case Intrinsic::loongarch_lasx_xvreplve_b:
6564 case Intrinsic::loongarch_lasx_xvreplve_h:
6565 case Intrinsic::loongarch_lasx_xvreplve_w:
6566 case Intrinsic::loongarch_lasx_xvreplve_d:
6567 return DAG.getNode(LoongArchISD::VREPLVE, DL, N->getValueType(0),
6568 N->getOperand(1),
6569 DAG.getNode(ISD::ANY_EXTEND, DL, Subtarget.getGRLenVT(),
6570 N->getOperand(2)));
6571 case Intrinsic::loongarch_lsx_vpickve2gr_b:
6572 if (!Subtarget.is64Bit())
6574 break;
6575 case Intrinsic::loongarch_lsx_vpickve2gr_h:
6576 case Intrinsic::loongarch_lasx_xvpickve2gr_w:
6577 if (!Subtarget.is64Bit())
6579 break;
6580 case Intrinsic::loongarch_lsx_vpickve2gr_w:
6581 if (!Subtarget.is64Bit())
6583 break;
6584 case Intrinsic::loongarch_lsx_vpickve2gr_bu:
6585 if (!Subtarget.is64Bit())
6587 break;
6588 case Intrinsic::loongarch_lsx_vpickve2gr_hu:
6589 case Intrinsic::loongarch_lasx_xvpickve2gr_wu:
6590 if (!Subtarget.is64Bit())
6592 break;
6593 case Intrinsic::loongarch_lsx_vpickve2gr_wu:
6594 if (!Subtarget.is64Bit())
6596 break;
6597 case Intrinsic::loongarch_lsx_bz_b:
6598 case Intrinsic::loongarch_lsx_bz_h:
6599 case Intrinsic::loongarch_lsx_bz_w:
6600 case Intrinsic::loongarch_lsx_bz_d:
6601 case Intrinsic::loongarch_lasx_xbz_b:
6602 case Intrinsic::loongarch_lasx_xbz_h:
6603 case Intrinsic::loongarch_lasx_xbz_w:
6604 case Intrinsic::loongarch_lasx_xbz_d:
6605 if (!Subtarget.is64Bit())
6606 return DAG.getNode(LoongArchISD::VALL_ZERO, DL, N->getValueType(0),
6607 N->getOperand(1));
6608 break;
6609 case Intrinsic::loongarch_lsx_bz_v:
6610 case Intrinsic::loongarch_lasx_xbz_v:
6611 if (!Subtarget.is64Bit())
6612 return DAG.getNode(LoongArchISD::VANY_ZERO, DL, N->getValueType(0),
6613 N->getOperand(1));
6614 break;
6615 case Intrinsic::loongarch_lsx_bnz_b:
6616 case Intrinsic::loongarch_lsx_bnz_h:
6617 case Intrinsic::loongarch_lsx_bnz_w:
6618 case Intrinsic::loongarch_lsx_bnz_d:
6619 case Intrinsic::loongarch_lasx_xbnz_b:
6620 case Intrinsic::loongarch_lasx_xbnz_h:
6621 case Intrinsic::loongarch_lasx_xbnz_w:
6622 case Intrinsic::loongarch_lasx_xbnz_d:
6623 if (!Subtarget.is64Bit())
6624 return DAG.getNode(LoongArchISD::VALL_NONZERO, DL, N->getValueType(0),
6625 N->getOperand(1));
6626 break;
6627 case Intrinsic::loongarch_lsx_bnz_v:
6628 case Intrinsic::loongarch_lasx_xbnz_v:
6629 if (!Subtarget.is64Bit())
6630 return DAG.getNode(LoongArchISD::VANY_NONZERO, DL, N->getValueType(0),
6631 N->getOperand(1));
6632 break;
6633 case Intrinsic::loongarch_lasx_concat_128_s:
6634 case Intrinsic::loongarch_lasx_concat_128_d:
6635 case Intrinsic::loongarch_lasx_concat_128:
6636 return DAG.getNode(ISD::CONCAT_VECTORS, DL, N->getValueType(0),
6637 N->getOperand(1), N->getOperand(2));
6638 }
6639 return SDValue();
6640}
6641
6644 const LoongArchSubtarget &Subtarget) {
6645   // If the input to MOVGR2FR_W_LA64 is just MOVFR2GR_S_LA64 then the
6646   // conversion is unnecessary and can be replaced with the
6647   // MOVFR2GR_S_LA64 operand.
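  // A rough illustration in DAG terms (not taken from a test case, just the
  // pattern this combine matches):
  //   (MOVGR2FR_W_LA64 (MOVFR2GR_S_LA64 x)) --> x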
6648 SDValue Op0 = N->getOperand(0);
6650 return Op0.getOperand(0);
6651 return SDValue();
6652}
6653
6656 const LoongArchSubtarget &Subtarget) {
6657 // If the input to MOVFR2GR_S_LA64 is just MOVGR2FR_W_LA64 then the
6658 // conversion is unnecessary and can be replaced with the MOVGR2FR_W_LA64
6659 // operand.
6660 SDValue Op0 = N->getOperand(0);
6662 assert(Op0.getOperand(0).getValueType() == N->getSimpleValueType(0) &&
6663 "Unexpected value type!");
6664 return Op0.getOperand(0);
6665 }
6666 return SDValue();
6667}
6668
6671 const LoongArchSubtarget &Subtarget) {
6672 MVT VT = N->getSimpleValueType(0);
6673 unsigned NumBits = VT.getScalarSizeInBits();
6674
6675 // Simplify the inputs.
6676 const TargetLowering &TLI = DAG.getTargetLoweringInfo();
6677 APInt DemandedMask(APInt::getAllOnes(NumBits));
6678 if (TLI.SimplifyDemandedBits(SDValue(N, 0), DemandedMask, DCI))
6679 return SDValue(N, 0);
6680
6681 return SDValue();
6682}
6683
6684static SDValue
6687 const LoongArchSubtarget &Subtarget) {
6688 SDValue Op0 = N->getOperand(0);
6689 SDLoc DL(N);
6690
6691 // If the input to SplitPairF64 is just BuildPairF64 then the operation is
6692 // redundant. Instead, use BuildPairF64's operands directly.
6694 return DCI.CombineTo(N, Op0.getOperand(0), Op0.getOperand(1));
6695
6696 if (Op0->isUndef()) {
6697 SDValue Lo = DAG.getUNDEF(MVT::i32);
6698 SDValue Hi = DAG.getUNDEF(MVT::i32);
6699 return DCI.CombineTo(N, Lo, Hi);
6700 }
6701
6702 // It's cheaper to materialise two 32-bit integers than to load a double
6703 // from the constant pool and transfer it to integer registers through the
6704 // stack.
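  // For instance, the f64 constant 1.0 has the bit pattern 0x3FF0000000000000,
  // so this path would emit Lo = 0x00000000 and Hi = 0x3FF00000 as two plain
  // 32-bit immediates instead of a constant-pool load.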
6706 APInt V = C->getValueAPF().bitcastToAPInt();
6707 SDValue Lo = DAG.getConstant(V.trunc(32), DL, MVT::i32);
6708 SDValue Hi = DAG.getConstant(V.lshr(32).trunc(32), DL, MVT::i32);
6709 return DCI.CombineTo(N, Lo, Hi);
6710 }
6711
6712 return SDValue();
6713}
6714
6715static SDValue
6718 const LoongArchSubtarget &Subtarget) {
6719 if (!DCI.isBeforeLegalize())
6720 return SDValue();
6721
6722 MVT EltVT = N->getSimpleValueType(0);
6723 SDValue Vec = N->getOperand(0);
6724 EVT VecTy = Vec->getValueType(0);
6725 SDValue Idx = N->getOperand(1);
6726 unsigned IdxOp = Idx.getOpcode();
6727 SDLoc DL(N);
6728
6729 if (!VecTy.is256BitVector() || isa<ConstantSDNode>(Idx))
6730 return SDValue();
6731
6732 // Combine:
6733 // t2 = truncate t1
6734 // t3 = {zero/sign/any}_extend t2
6735 // t4 = extract_vector_elt t0, t3
6736 // to:
6737 // t4 = extract_vector_elt t0, t1
6738 if (IdxOp == ISD::ZERO_EXTEND || IdxOp == ISD::SIGN_EXTEND ||
6739 IdxOp == ISD::ANY_EXTEND) {
6740 SDValue IdxOrig = Idx.getOperand(0);
6741     if (IdxOrig.getOpcode() != ISD::TRUNCATE)
6742 return SDValue();
6743
6744 return DAG.getNode(ISD::EXTRACT_VECTOR_ELT, DL, EltVT, Vec,
6745 IdxOrig.getOperand(0));
6746 }
6747
6748 return SDValue();
6749}
6750
6752 DAGCombinerInfo &DCI) const {
6753 SelectionDAG &DAG = DCI.DAG;
6754 switch (N->getOpcode()) {
6755 default:
6756 break;
6757 case ISD::AND:
6758 return performANDCombine(N, DAG, DCI, Subtarget);
6759 case ISD::OR:
6760 return performORCombine(N, DAG, DCI, Subtarget);
6761 case ISD::SETCC:
6762 return performSETCCCombine(N, DAG, DCI, Subtarget);
6763 case ISD::SRL:
6764 return performSRLCombine(N, DAG, DCI, Subtarget);
6765 case ISD::BITCAST:
6766 return performBITCASTCombine(N, DAG, DCI, Subtarget);
6768 return performBITREV_WCombine(N, DAG, DCI, Subtarget);
6770 return performBR_CCCombine(N, DAG, DCI, Subtarget);
6772 return performSELECT_CCCombine(N, DAG, DCI, Subtarget);
6774 return performINTRINSIC_WO_CHAINCombine(N, DAG, DCI, Subtarget);
6776 return performMOVGR2FR_WCombine(N, DAG, DCI, Subtarget);
6778 return performMOVFR2GR_SCombine(N, DAG, DCI, Subtarget);
6781 return performVMSKLTZCombine(N, DAG, DCI, Subtarget);
6783 return performSPLIT_PAIR_F64Combine(N, DAG, DCI, Subtarget);
6785 return performEXTRACT_VECTOR_ELTCombine(N, DAG, DCI, Subtarget);
6786 }
6787 return SDValue();
6788}
6789
6792 if (!ZeroDivCheck)
6793 return MBB;
6794
6795 // Build instructions:
6796 // MBB:
6797 // div(or mod) $dst, $dividend, $divisor
6798 // bne $divisor, $zero, SinkMBB
6799 // BreakMBB:
6800 // break 7 // BRK_DIVZERO
6801 // SinkMBB:
6802 // fallthrough
6803 const BasicBlock *LLVM_BB = MBB->getBasicBlock();
6804 MachineFunction::iterator It = ++MBB->getIterator();
6805 MachineFunction *MF = MBB->getParent();
6806 auto BreakMBB = MF->CreateMachineBasicBlock(LLVM_BB);
6807 auto SinkMBB = MF->CreateMachineBasicBlock(LLVM_BB);
6808 MF->insert(It, BreakMBB);
6809 MF->insert(It, SinkMBB);
6810
6811 // Transfer the remainder of MBB and its successor edges to SinkMBB.
6812 SinkMBB->splice(SinkMBB->end(), MBB, std::next(MI.getIterator()), MBB->end());
6813 SinkMBB->transferSuccessorsAndUpdatePHIs(MBB);
6814
6815 const TargetInstrInfo &TII = *MF->getSubtarget().getInstrInfo();
6816 DebugLoc DL = MI.getDebugLoc();
6817 MachineOperand &Divisor = MI.getOperand(2);
6818 Register DivisorReg = Divisor.getReg();
6819
6820 // MBB:
6821 BuildMI(MBB, DL, TII.get(LoongArch::BNE))
6822 .addReg(DivisorReg, getKillRegState(Divisor.isKill()))
6823 .addReg(LoongArch::R0)
6824 .addMBB(SinkMBB);
6825 MBB->addSuccessor(BreakMBB);
6826 MBB->addSuccessor(SinkMBB);
6827
6828 // BreakMBB:
6829   // See the Linux header file arch/loongarch/include/uapi/asm/break.h for the
6830 // definition of BRK_DIVZERO.
6831 BuildMI(BreakMBB, DL, TII.get(LoongArch::BREAK)).addImm(7 /*BRK_DIVZERO*/);
6832 BreakMBB->addSuccessor(SinkMBB);
6833
6834 // Clear Divisor's kill flag.
6835 Divisor.setIsKill(false);
6836
6837 return SinkMBB;
6838}
6839
6840static MachineBasicBlock *
6842 const LoongArchSubtarget &Subtarget) {
6843 unsigned CondOpc;
6844 switch (MI.getOpcode()) {
6845 default:
6846 llvm_unreachable("Unexpected opcode");
6847 case LoongArch::PseudoVBZ:
6848 CondOpc = LoongArch::VSETEQZ_V;
6849 break;
6850 case LoongArch::PseudoVBZ_B:
6851 CondOpc = LoongArch::VSETANYEQZ_B;
6852 break;
6853 case LoongArch::PseudoVBZ_H:
6854 CondOpc = LoongArch::VSETANYEQZ_H;
6855 break;
6856 case LoongArch::PseudoVBZ_W:
6857 CondOpc = LoongArch::VSETANYEQZ_W;
6858 break;
6859 case LoongArch::PseudoVBZ_D:
6860 CondOpc = LoongArch::VSETANYEQZ_D;
6861 break;
6862 case LoongArch::PseudoVBNZ:
6863 CondOpc = LoongArch::VSETNEZ_V;
6864 break;
6865 case LoongArch::PseudoVBNZ_B:
6866 CondOpc = LoongArch::VSETALLNEZ_B;
6867 break;
6868 case LoongArch::PseudoVBNZ_H:
6869 CondOpc = LoongArch::VSETALLNEZ_H;
6870 break;
6871 case LoongArch::PseudoVBNZ_W:
6872 CondOpc = LoongArch::VSETALLNEZ_W;
6873 break;
6874 case LoongArch::PseudoVBNZ_D:
6875 CondOpc = LoongArch::VSETALLNEZ_D;
6876 break;
6877 case LoongArch::PseudoXVBZ:
6878 CondOpc = LoongArch::XVSETEQZ_V;
6879 break;
6880 case LoongArch::PseudoXVBZ_B:
6881 CondOpc = LoongArch::XVSETANYEQZ_B;
6882 break;
6883 case LoongArch::PseudoXVBZ_H:
6884 CondOpc = LoongArch::XVSETANYEQZ_H;
6885 break;
6886 case LoongArch::PseudoXVBZ_W:
6887 CondOpc = LoongArch::XVSETANYEQZ_W;
6888 break;
6889 case LoongArch::PseudoXVBZ_D:
6890 CondOpc = LoongArch::XVSETANYEQZ_D;
6891 break;
6892 case LoongArch::PseudoXVBNZ:
6893 CondOpc = LoongArch::XVSETNEZ_V;
6894 break;
6895 case LoongArch::PseudoXVBNZ_B:
6896 CondOpc = LoongArch::XVSETALLNEZ_B;
6897 break;
6898 case LoongArch::PseudoXVBNZ_H:
6899 CondOpc = LoongArch::XVSETALLNEZ_H;
6900 break;
6901 case LoongArch::PseudoXVBNZ_W:
6902 CondOpc = LoongArch::XVSETALLNEZ_W;
6903 break;
6904 case LoongArch::PseudoXVBNZ_D:
6905 CondOpc = LoongArch::XVSETALLNEZ_D;
6906 break;
6907 }
6908
6909 const TargetInstrInfo *TII = Subtarget.getInstrInfo();
6910 const BasicBlock *LLVM_BB = BB->getBasicBlock();
6911 DebugLoc DL = MI.getDebugLoc();
6914
6915 MachineFunction *F = BB->getParent();
6916 MachineBasicBlock *FalseBB = F->CreateMachineBasicBlock(LLVM_BB);
6917 MachineBasicBlock *TrueBB = F->CreateMachineBasicBlock(LLVM_BB);
6918 MachineBasicBlock *SinkBB = F->CreateMachineBasicBlock(LLVM_BB);
6919
6920 F->insert(It, FalseBB);
6921 F->insert(It, TrueBB);
6922 F->insert(It, SinkBB);
6923
6924 // Transfer the remainder of MBB and its successor edges to Sink.
6925 SinkBB->splice(SinkBB->end(), BB, std::next(MI.getIterator()), BB->end());
6927
6928 // Insert the real instruction to BB.
6929 Register FCC = MRI.createVirtualRegister(&LoongArch::CFRRegClass);
6930 BuildMI(BB, DL, TII->get(CondOpc), FCC).addReg(MI.getOperand(1).getReg());
6931
6932 // Insert branch.
6933 BuildMI(BB, DL, TII->get(LoongArch::BCNEZ)).addReg(FCC).addMBB(TrueBB);
6934 BB->addSuccessor(FalseBB);
6935 BB->addSuccessor(TrueBB);
6936
6937 // FalseBB.
6938 Register RD1 = MRI.createVirtualRegister(&LoongArch::GPRRegClass);
6939 BuildMI(FalseBB, DL, TII->get(LoongArch::ADDI_W), RD1)
6940 .addReg(LoongArch::R0)
6941 .addImm(0);
6942 BuildMI(FalseBB, DL, TII->get(LoongArch::PseudoBR)).addMBB(SinkBB);
6943 FalseBB->addSuccessor(SinkBB);
6944
6945 // TrueBB.
6946 Register RD2 = MRI.createVirtualRegister(&LoongArch::GPRRegClass);
6947 BuildMI(TrueBB, DL, TII->get(LoongArch::ADDI_W), RD2)
6948 .addReg(LoongArch::R0)
6949 .addImm(1);
6950 TrueBB->addSuccessor(SinkBB);
6951
6952 // SinkBB: merge the results.
6953 BuildMI(*SinkBB, SinkBB->begin(), DL, TII->get(LoongArch::PHI),
6954 MI.getOperand(0).getReg())
6955 .addReg(RD1)
6956 .addMBB(FalseBB)
6957 .addReg(RD2)
6958 .addMBB(TrueBB);
6959
6960 // The pseudo instruction is gone now.
6961 MI.eraseFromParent();
6962 return SinkBB;
6963}
6964
6965static MachineBasicBlock *
6967 const LoongArchSubtarget &Subtarget) {
6968 unsigned InsOp;
6969 unsigned BroadcastOp;
6970 unsigned HalfSize;
6971 switch (MI.getOpcode()) {
6972 default:
6973 llvm_unreachable("Unexpected opcode");
6974 case LoongArch::PseudoXVINSGR2VR_B:
6975 HalfSize = 16;
6976 BroadcastOp = LoongArch::XVREPLGR2VR_B;
6977 InsOp = LoongArch::XVEXTRINS_B;
6978 break;
6979 case LoongArch::PseudoXVINSGR2VR_H:
6980 HalfSize = 8;
6981 BroadcastOp = LoongArch::XVREPLGR2VR_H;
6982 InsOp = LoongArch::XVEXTRINS_H;
6983 break;
6984 }
6985 const TargetInstrInfo *TII = Subtarget.getInstrInfo();
6986 const TargetRegisterClass *RC = &LoongArch::LASX256RegClass;
6987 const TargetRegisterClass *SubRC = &LoongArch::LSX128RegClass;
6988 DebugLoc DL = MI.getDebugLoc();
6990 // XDst = vector_insert XSrc, Elt, Idx
6991 Register XDst = MI.getOperand(0).getReg();
6992 Register XSrc = MI.getOperand(1).getReg();
6993 Register Elt = MI.getOperand(2).getReg();
6994 unsigned Idx = MI.getOperand(3).getImm();
6995
6996 if (XSrc.isVirtual() && MRI.getVRegDef(XSrc)->isImplicitDef() &&
6997 Idx < HalfSize) {
6998 Register ScratchSubReg1 = MRI.createVirtualRegister(SubRC);
6999 Register ScratchSubReg2 = MRI.createVirtualRegister(SubRC);
7000
7001 BuildMI(*BB, MI, DL, TII->get(LoongArch::COPY), ScratchSubReg1)
7002 .addReg(XSrc, 0, LoongArch::sub_128);
7003 BuildMI(*BB, MI, DL,
7004 TII->get(HalfSize == 8 ? LoongArch::VINSGR2VR_H
7005 : LoongArch::VINSGR2VR_B),
7006 ScratchSubReg2)
7007 .addReg(ScratchSubReg1)
7008 .addReg(Elt)
7009 .addImm(Idx);
7010
7011 BuildMI(*BB, MI, DL, TII->get(LoongArch::SUBREG_TO_REG), XDst)
7012 .addImm(0)
7013 .addReg(ScratchSubReg2)
7014 .addImm(LoongArch::sub_128);
7015 } else {
7016 Register ScratchReg1 = MRI.createVirtualRegister(RC);
7017 Register ScratchReg2 = MRI.createVirtualRegister(RC);
7018
7019 BuildMI(*BB, MI, DL, TII->get(BroadcastOp), ScratchReg1).addReg(Elt);
7020
7021 BuildMI(*BB, MI, DL, TII->get(LoongArch::XVPERMI_Q), ScratchReg2)
7022 .addReg(ScratchReg1)
7023 .addReg(XSrc)
7024 .addImm(Idx >= HalfSize ? 48 : 18);
7025
7026 BuildMI(*BB, MI, DL, TII->get(InsOp), XDst)
7027 .addReg(XSrc)
7028 .addReg(ScratchReg2)
7029 .addImm((Idx >= HalfSize ? Idx - HalfSize : Idx) * 17);
7030 }
7031
7032 MI.eraseFromParent();
7033 return BB;
7034}
7035
7038 const LoongArchSubtarget &Subtarget) {
7039 assert(Subtarget.hasExtLSX());
7040 const TargetInstrInfo *TII = Subtarget.getInstrInfo();
7041 const TargetRegisterClass *RC = &LoongArch::LSX128RegClass;
7042 DebugLoc DL = MI.getDebugLoc();
7044 Register Dst = MI.getOperand(0).getReg();
7045 Register Src = MI.getOperand(1).getReg();
7046 Register ScratchReg1 = MRI.createVirtualRegister(RC);
7047 Register ScratchReg2 = MRI.createVirtualRegister(RC);
7048 Register ScratchReg3 = MRI.createVirtualRegister(RC);
7049
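  // Sketch of the expansion performed below: zero an LSX register with VLDI,
  // insert the GPR operand into element 0, run VPCNT over the vector, and move
  // element 0 of the result back into the destination GPR.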
7050 BuildMI(*BB, MI, DL, TII->get(LoongArch::VLDI), ScratchReg1).addImm(0);
7051 BuildMI(*BB, MI, DL,
7052 TII->get(Subtarget.is64Bit() ? LoongArch::VINSGR2VR_D
7053 : LoongArch::VINSGR2VR_W),
7054 ScratchReg2)
7055 .addReg(ScratchReg1)
7056 .addReg(Src)
7057 .addImm(0);
7058 BuildMI(
7059 *BB, MI, DL,
7060 TII->get(Subtarget.is64Bit() ? LoongArch::VPCNT_D : LoongArch::VPCNT_W),
7061 ScratchReg3)
7062 .addReg(ScratchReg2);
7063 BuildMI(*BB, MI, DL,
7064 TII->get(Subtarget.is64Bit() ? LoongArch::VPICKVE2GR_D
7065 : LoongArch::VPICKVE2GR_W),
7066 Dst)
7067 .addReg(ScratchReg3)
7068 .addImm(0);
7069
7070 MI.eraseFromParent();
7071 return BB;
7072}
7073
7074static MachineBasicBlock *
7076 const LoongArchSubtarget &Subtarget) {
7077 const TargetInstrInfo *TII = Subtarget.getInstrInfo();
7078 const TargetRegisterClass *RC = &LoongArch::LSX128RegClass;
7079 const LoongArchRegisterInfo *TRI = Subtarget.getRegisterInfo();
7081 Register Dst = MI.getOperand(0).getReg();
7082 Register Src = MI.getOperand(1).getReg();
7083 DebugLoc DL = MI.getDebugLoc();
7084 unsigned EleBits = 8;
7085 unsigned NotOpc = 0;
7086 unsigned MskOpc;
7087
7088 switch (MI.getOpcode()) {
7089 default:
7090 llvm_unreachable("Unexpected opcode");
7091 case LoongArch::PseudoVMSKLTZ_B:
7092 MskOpc = LoongArch::VMSKLTZ_B;
7093 break;
7094 case LoongArch::PseudoVMSKLTZ_H:
7095 MskOpc = LoongArch::VMSKLTZ_H;
7096 EleBits = 16;
7097 break;
7098 case LoongArch::PseudoVMSKLTZ_W:
7099 MskOpc = LoongArch::VMSKLTZ_W;
7100 EleBits = 32;
7101 break;
7102 case LoongArch::PseudoVMSKLTZ_D:
7103 MskOpc = LoongArch::VMSKLTZ_D;
7104 EleBits = 64;
7105 break;
7106 case LoongArch::PseudoVMSKGEZ_B:
7107 MskOpc = LoongArch::VMSKGEZ_B;
7108 break;
7109 case LoongArch::PseudoVMSKEQZ_B:
7110 MskOpc = LoongArch::VMSKNZ_B;
7111 NotOpc = LoongArch::VNOR_V;
7112 break;
7113 case LoongArch::PseudoVMSKNEZ_B:
7114 MskOpc = LoongArch::VMSKNZ_B;
7115 break;
7116 case LoongArch::PseudoXVMSKLTZ_B:
7117 MskOpc = LoongArch::XVMSKLTZ_B;
7118 RC = &LoongArch::LASX256RegClass;
7119 break;
7120 case LoongArch::PseudoXVMSKLTZ_H:
7121 MskOpc = LoongArch::XVMSKLTZ_H;
7122 RC = &LoongArch::LASX256RegClass;
7123 EleBits = 16;
7124 break;
7125 case LoongArch::PseudoXVMSKLTZ_W:
7126 MskOpc = LoongArch::XVMSKLTZ_W;
7127 RC = &LoongArch::LASX256RegClass;
7128 EleBits = 32;
7129 break;
7130 case LoongArch::PseudoXVMSKLTZ_D:
7131 MskOpc = LoongArch::XVMSKLTZ_D;
7132 RC = &LoongArch::LASX256RegClass;
7133 EleBits = 64;
7134 break;
7135 case LoongArch::PseudoXVMSKGEZ_B:
7136 MskOpc = LoongArch::XVMSKGEZ_B;
7137 RC = &LoongArch::LASX256RegClass;
7138 break;
7139 case LoongArch::PseudoXVMSKEQZ_B:
7140 MskOpc = LoongArch::XVMSKNZ_B;
7141 NotOpc = LoongArch::XVNOR_V;
7142 RC = &LoongArch::LASX256RegClass;
7143 break;
7144 case LoongArch::PseudoXVMSKNEZ_B:
7145 MskOpc = LoongArch::XVMSKNZ_B;
7146 RC = &LoongArch::LASX256RegClass;
7147 break;
7148 }
7149
7150 Register Msk = MRI.createVirtualRegister(RC);
7151 if (NotOpc) {
7152 Register Tmp = MRI.createVirtualRegister(RC);
7153 BuildMI(*BB, MI, DL, TII->get(MskOpc), Tmp).addReg(Src);
7154 BuildMI(*BB, MI, DL, TII->get(NotOpc), Msk)
7155 .addReg(Tmp, RegState::Kill)
7156 .addReg(Tmp, RegState::Kill);
7157 } else {
7158 BuildMI(*BB, MI, DL, TII->get(MskOpc), Msk).addReg(Src);
7159 }
7160
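  // For 256-bit (LASX) sources the mask is produced per 128-bit half, so the
  // code below reads both 32-bit halves with XVPICKVE2GR_WU and merges the
  // high half into bits [256/EleBits-1 : 128/EleBits] of the result using
  // BSTRINS; 128-bit (LSX) sources only need a single VPICKVE2GR_HU.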
7161 if (TRI->getRegSizeInBits(*RC) > 128) {
7162 Register Lo = MRI.createVirtualRegister(&LoongArch::GPRRegClass);
7163 Register Hi = MRI.createVirtualRegister(&LoongArch::GPRRegClass);
7164 BuildMI(*BB, MI, DL, TII->get(LoongArch::XVPICKVE2GR_WU), Lo)
7165 .addReg(Msk)
7166 .addImm(0);
7167 BuildMI(*BB, MI, DL, TII->get(LoongArch::XVPICKVE2GR_WU), Hi)
7168 .addReg(Msk, RegState::Kill)
7169 .addImm(4);
7170 BuildMI(*BB, MI, DL,
7171 TII->get(Subtarget.is64Bit() ? LoongArch::BSTRINS_D
7172 : LoongArch::BSTRINS_W),
7173 Dst)
7176 .addImm(256 / EleBits - 1)
7177 .addImm(128 / EleBits);
7178 } else {
7179 BuildMI(*BB, MI, DL, TII->get(LoongArch::VPICKVE2GR_HU), Dst)
7180 .addReg(Msk, RegState::Kill)
7181 .addImm(0);
7182 }
7183
7184 MI.eraseFromParent();
7185 return BB;
7186}
7187
7188static MachineBasicBlock *
7190 const LoongArchSubtarget &Subtarget) {
7191 assert(MI.getOpcode() == LoongArch::SplitPairF64Pseudo &&
7192 "Unexpected instruction");
7193
7194 MachineFunction &MF = *BB->getParent();
7195 DebugLoc DL = MI.getDebugLoc();
7197 Register LoReg = MI.getOperand(0).getReg();
7198 Register HiReg = MI.getOperand(1).getReg();
7199 Register SrcReg = MI.getOperand(2).getReg();
7200
7201 BuildMI(*BB, MI, DL, TII.get(LoongArch::MOVFR2GR_S_64), LoReg).addReg(SrcReg);
7202 BuildMI(*BB, MI, DL, TII.get(LoongArch::MOVFRH2GR_S), HiReg)
7203 .addReg(SrcReg, getKillRegState(MI.getOperand(2).isKill()));
7204 MI.eraseFromParent(); // The pseudo instruction is gone now.
7205 return BB;
7206}
7207
7208static MachineBasicBlock *
7210 const LoongArchSubtarget &Subtarget) {
7211 assert(MI.getOpcode() == LoongArch::BuildPairF64Pseudo &&
7212 "Unexpected instruction");
7213
7214 MachineFunction &MF = *BB->getParent();
7215 DebugLoc DL = MI.getDebugLoc();
7218 Register TmpReg = MRI.createVirtualRegister(&LoongArch::FPR64RegClass);
7219 Register DstReg = MI.getOperand(0).getReg();
7220 Register LoReg = MI.getOperand(1).getReg();
7221 Register HiReg = MI.getOperand(2).getReg();
7222
7223 BuildMI(*BB, MI, DL, TII.get(LoongArch::MOVGR2FR_W_64), TmpReg)
7224 .addReg(LoReg, getKillRegState(MI.getOperand(1).isKill()));
7225 BuildMI(*BB, MI, DL, TII.get(LoongArch::MOVGR2FRH_W), DstReg)
7226 .addReg(TmpReg, RegState::Kill)
7227 .addReg(HiReg, getKillRegState(MI.getOperand(2).isKill()));
7228 MI.eraseFromParent(); // The pseudo instruction is gone now.
7229 return BB;
7230}
7231
7233 switch (MI.getOpcode()) {
7234 default:
7235 return false;
7236 case LoongArch::Select_GPR_Using_CC_GPR:
7237 return true;
7238 }
7239}
7240
7241static MachineBasicBlock *
7243 const LoongArchSubtarget &Subtarget) {
7244 // To "insert" Select_* instructions, we actually have to insert the triangle
7245 // control-flow pattern. The incoming instructions know the destination vreg
7246 // to set, the condition code register to branch on, the true/false values to
7247 // select between, and the condcode to use to select the appropriate branch.
7248 //
7249 // We produce the following control flow:
7250 // HeadMBB
7251 // | \
7252 // | IfFalseMBB
7253 // | /
7254 // TailMBB
7255 //
7256 // When we find a sequence of selects we attempt to optimize their emission
7257 // by sharing the control flow. Currently we only handle cases where we have
7258 // multiple selects with the exact same condition (same LHS, RHS and CC).
7259 // The selects may be interleaved with other instructions if the other
7260 // instructions meet some requirements we deem safe:
7261   // - They are not pseudo instructions.
7262   // - They are debug instructions, or otherwise
7263   // - they do not have side-effects, do not access memory, and their inputs do
7264   //   not depend on the results of the select pseudo-instructions.
7265 // The TrueV/FalseV operands of the selects cannot depend on the result of
7266 // previous selects in the sequence.
7267 // These conditions could be further relaxed. See the X86 target for a
7268 // related approach and more information.
7269
7270 Register LHS = MI.getOperand(1).getReg();
7271 Register RHS;
7272 if (MI.getOperand(2).isReg())
7273 RHS = MI.getOperand(2).getReg();
7274 auto CC = static_cast<unsigned>(MI.getOperand(3).getImm());
7275
7276 SmallVector<MachineInstr *, 4> SelectDebugValues;
7277 SmallSet<Register, 4> SelectDests;
7278 SelectDests.insert(MI.getOperand(0).getReg());
7279
7280 MachineInstr *LastSelectPseudo = &MI;
7281 for (auto E = BB->end(), SequenceMBBI = MachineBasicBlock::iterator(MI);
7282 SequenceMBBI != E; ++SequenceMBBI) {
7283 if (SequenceMBBI->isDebugInstr())
7284 continue;
7285 if (isSelectPseudo(*SequenceMBBI)) {
7286 if (SequenceMBBI->getOperand(1).getReg() != LHS ||
7287 !SequenceMBBI->getOperand(2).isReg() ||
7288 SequenceMBBI->getOperand(2).getReg() != RHS ||
7289 SequenceMBBI->getOperand(3).getImm() != CC ||
7290 SelectDests.count(SequenceMBBI->getOperand(4).getReg()) ||
7291 SelectDests.count(SequenceMBBI->getOperand(5).getReg()))
7292 break;
7293 LastSelectPseudo = &*SequenceMBBI;
7294 SequenceMBBI->collectDebugValues(SelectDebugValues);
7295 SelectDests.insert(SequenceMBBI->getOperand(0).getReg());
7296 continue;
7297 }
7298 if (SequenceMBBI->hasUnmodeledSideEffects() ||
7299 SequenceMBBI->mayLoadOrStore() ||
7300 SequenceMBBI->usesCustomInsertionHook())
7301 break;
7302 if (llvm::any_of(SequenceMBBI->operands(), [&](MachineOperand &MO) {
7303 return MO.isReg() && MO.isUse() && SelectDests.count(MO.getReg());
7304 }))
7305 break;
7306 }
7307
7308 const LoongArchInstrInfo &TII = *Subtarget.getInstrInfo();
7309 const BasicBlock *LLVM_BB = BB->getBasicBlock();
7310 DebugLoc DL = MI.getDebugLoc();
7312
7313 MachineBasicBlock *HeadMBB = BB;
7314 MachineFunction *F = BB->getParent();
7315 MachineBasicBlock *TailMBB = F->CreateMachineBasicBlock(LLVM_BB);
7316 MachineBasicBlock *IfFalseMBB = F->CreateMachineBasicBlock(LLVM_BB);
7317
7318 F->insert(I, IfFalseMBB);
7319 F->insert(I, TailMBB);
7320
7321 // Set the call frame size on entry to the new basic blocks.
7322 unsigned CallFrameSize = TII.getCallFrameSizeAt(*LastSelectPseudo);
7323 IfFalseMBB->setCallFrameSize(CallFrameSize);
7324 TailMBB->setCallFrameSize(CallFrameSize);
7325
7326 // Transfer debug instructions associated with the selects to TailMBB.
7327 for (MachineInstr *DebugInstr : SelectDebugValues) {
7328 TailMBB->push_back(DebugInstr->removeFromParent());
7329 }
7330
7331 // Move all instructions after the sequence to TailMBB.
7332 TailMBB->splice(TailMBB->end(), HeadMBB,
7333 std::next(LastSelectPseudo->getIterator()), HeadMBB->end());
7334 // Update machine-CFG edges by transferring all successors of the current
7335 // block to the new block which will contain the Phi nodes for the selects.
7336 TailMBB->transferSuccessorsAndUpdatePHIs(HeadMBB);
7337 // Set the successors for HeadMBB.
7338 HeadMBB->addSuccessor(IfFalseMBB);
7339 HeadMBB->addSuccessor(TailMBB);
7340
7341 // Insert appropriate branch.
7342 if (MI.getOperand(2).isImm())
7343 BuildMI(HeadMBB, DL, TII.get(CC))
7344 .addReg(LHS)
7345 .addImm(MI.getOperand(2).getImm())
7346 .addMBB(TailMBB);
7347 else
7348 BuildMI(HeadMBB, DL, TII.get(CC)).addReg(LHS).addReg(RHS).addMBB(TailMBB);
7349
7350 // IfFalseMBB just falls through to TailMBB.
7351 IfFalseMBB->addSuccessor(TailMBB);
7352
7353 // Create PHIs for all of the select pseudo-instructions.
7354 auto SelectMBBI = MI.getIterator();
7355 auto SelectEnd = std::next(LastSelectPseudo->getIterator());
7356 auto InsertionPoint = TailMBB->begin();
7357 while (SelectMBBI != SelectEnd) {
7358 auto Next = std::next(SelectMBBI);
7359 if (isSelectPseudo(*SelectMBBI)) {
7360 // %Result = phi [ %TrueValue, HeadMBB ], [ %FalseValue, IfFalseMBB ]
7361 BuildMI(*TailMBB, InsertionPoint, SelectMBBI->getDebugLoc(),
7362 TII.get(LoongArch::PHI), SelectMBBI->getOperand(0).getReg())
7363 .addReg(SelectMBBI->getOperand(4).getReg())
7364 .addMBB(HeadMBB)
7365 .addReg(SelectMBBI->getOperand(5).getReg())
7366 .addMBB(IfFalseMBB);
7367 SelectMBBI->eraseFromParent();
7368 }
7369 SelectMBBI = Next;
7370 }
7371
7372 F->getProperties().resetNoPHIs();
7373 return TailMBB;
7374}
7375
7376MachineBasicBlock *LoongArchTargetLowering::EmitInstrWithCustomInserter(
7377 MachineInstr &MI, MachineBasicBlock *BB) const {
7378 const TargetInstrInfo *TII = Subtarget.getInstrInfo();
7379 DebugLoc DL = MI.getDebugLoc();
7380
7381 switch (MI.getOpcode()) {
7382 default:
7383 llvm_unreachable("Unexpected instr type to insert");
7384 case LoongArch::DIV_W:
7385 case LoongArch::DIV_WU:
7386 case LoongArch::MOD_W:
7387 case LoongArch::MOD_WU:
7388 case LoongArch::DIV_D:
7389 case LoongArch::DIV_DU:
7390 case LoongArch::MOD_D:
7391 case LoongArch::MOD_DU:
7392 return insertDivByZeroTrap(MI, BB);
7393 break;
7394 case LoongArch::WRFCSR: {
7395 BuildMI(*BB, MI, DL, TII->get(LoongArch::MOVGR2FCSR),
7396 LoongArch::FCSR0 + MI.getOperand(0).getImm())
7397 .addReg(MI.getOperand(1).getReg());
7398 MI.eraseFromParent();
7399 return BB;
7400 }
7401 case LoongArch::RDFCSR: {
7402 MachineInstr *ReadFCSR =
7403 BuildMI(*BB, MI, DL, TII->get(LoongArch::MOVFCSR2GR),
7404 MI.getOperand(0).getReg())
7405 .addReg(LoongArch::FCSR0 + MI.getOperand(1).getImm());
7406 ReadFCSR->getOperand(1).setIsUndef();
7407 MI.eraseFromParent();
7408 return BB;
7409 }
7410 case LoongArch::Select_GPR_Using_CC_GPR:
7411 return emitSelectPseudo(MI, BB, Subtarget);
7412 case LoongArch::BuildPairF64Pseudo:
7413 return emitBuildPairF64Pseudo(MI, BB, Subtarget);
7414 case LoongArch::SplitPairF64Pseudo:
7415 return emitSplitPairF64Pseudo(MI, BB, Subtarget);
7416 case LoongArch::PseudoVBZ:
7417 case LoongArch::PseudoVBZ_B:
7418 case LoongArch::PseudoVBZ_H:
7419 case LoongArch::PseudoVBZ_W:
7420 case LoongArch::PseudoVBZ_D:
7421 case LoongArch::PseudoVBNZ:
7422 case LoongArch::PseudoVBNZ_B:
7423 case LoongArch::PseudoVBNZ_H:
7424 case LoongArch::PseudoVBNZ_W:
7425 case LoongArch::PseudoVBNZ_D:
7426 case LoongArch::PseudoXVBZ:
7427 case LoongArch::PseudoXVBZ_B:
7428 case LoongArch::PseudoXVBZ_H:
7429 case LoongArch::PseudoXVBZ_W:
7430 case LoongArch::PseudoXVBZ_D:
7431 case LoongArch::PseudoXVBNZ:
7432 case LoongArch::PseudoXVBNZ_B:
7433 case LoongArch::PseudoXVBNZ_H:
7434 case LoongArch::PseudoXVBNZ_W:
7435 case LoongArch::PseudoXVBNZ_D:
7436 return emitVecCondBranchPseudo(MI, BB, Subtarget);
7437 case LoongArch::PseudoXVINSGR2VR_B:
7438 case LoongArch::PseudoXVINSGR2VR_H:
7439 return emitPseudoXVINSGR2VR(MI, BB, Subtarget);
7440 case LoongArch::PseudoCTPOP:
7441 return emitPseudoCTPOP(MI, BB, Subtarget);
7442 case LoongArch::PseudoVMSKLTZ_B:
7443 case LoongArch::PseudoVMSKLTZ_H:
7444 case LoongArch::PseudoVMSKLTZ_W:
7445 case LoongArch::PseudoVMSKLTZ_D:
7446 case LoongArch::PseudoVMSKGEZ_B:
7447 case LoongArch::PseudoVMSKEQZ_B:
7448 case LoongArch::PseudoVMSKNEZ_B:
7449 case LoongArch::PseudoXVMSKLTZ_B:
7450 case LoongArch::PseudoXVMSKLTZ_H:
7451 case LoongArch::PseudoXVMSKLTZ_W:
7452 case LoongArch::PseudoXVMSKLTZ_D:
7453 case LoongArch::PseudoXVMSKGEZ_B:
7454 case LoongArch::PseudoXVMSKEQZ_B:
7455 case LoongArch::PseudoXVMSKNEZ_B:
7456 return emitPseudoVMSKCOND(MI, BB, Subtarget);
7457 case TargetOpcode::STATEPOINT:
7458     // STATEPOINT is a pseudo instruction which has no implicit defs/uses,
7459     // while the bl call instruction (to which the statepoint is lowered in
7460     // the end) has an implicit def. This def is early-clobber as it is set
7461     // at the moment of the call, before any use is read.
7462     // Add this implicit dead def here as a workaround.
7463 MI.addOperand(*MI.getMF(),
7465 LoongArch::R1, /*isDef*/ true,
7466 /*isImp*/ true, /*isKill*/ false, /*isDead*/ true,
7467 /*isUndef*/ false, /*isEarlyClobber*/ true));
7468 if (!Subtarget.is64Bit())
7469 report_fatal_error("STATEPOINT is only supported on 64-bit targets");
7470 return emitPatchPoint(MI, BB);
7471 }
7472}
7473
7475 EVT VT, unsigned AddrSpace, Align Alignment, MachineMemOperand::Flags Flags,
7476 unsigned *Fast) const {
7477 if (!Subtarget.hasUAL())
7478 return false;
7479
7480 // TODO: set reasonable speed number.
7481 if (Fast)
7482 *Fast = 1;
7483 return true;
7484}
7485
7486const char *LoongArchTargetLowering::getTargetNodeName(unsigned Opcode) const {
7487 switch ((LoongArchISD::NodeType)Opcode) {
7489 break;
7490
7491#define NODE_NAME_CASE(node) \
7492 case LoongArchISD::node: \
7493 return "LoongArchISD::" #node;
7494
7495 // TODO: Add more target-dependent nodes later.
7496 NODE_NAME_CASE(CALL)
7497 NODE_NAME_CASE(CALL_MEDIUM)
7498 NODE_NAME_CASE(CALL_LARGE)
7499 NODE_NAME_CASE(RET)
7500 NODE_NAME_CASE(TAIL)
7501 NODE_NAME_CASE(TAIL_MEDIUM)
7502 NODE_NAME_CASE(TAIL_LARGE)
7503 NODE_NAME_CASE(SELECT_CC)
7504 NODE_NAME_CASE(BR_CC)
7505 NODE_NAME_CASE(BRCOND)
7506 NODE_NAME_CASE(SLL_W)
7507 NODE_NAME_CASE(SRA_W)
7508 NODE_NAME_CASE(SRL_W)
7509 NODE_NAME_CASE(BSTRINS)
7510 NODE_NAME_CASE(BSTRPICK)
7511 NODE_NAME_CASE(MOVGR2FR_W)
7512 NODE_NAME_CASE(MOVGR2FR_W_LA64)
7513 NODE_NAME_CASE(MOVGR2FR_D)
7514 NODE_NAME_CASE(MOVGR2FR_D_LO_HI)
7515 NODE_NAME_CASE(MOVFR2GR_S_LA64)
7516 NODE_NAME_CASE(FTINT)
7517 NODE_NAME_CASE(BUILD_PAIR_F64)
7518 NODE_NAME_CASE(SPLIT_PAIR_F64)
7519 NODE_NAME_CASE(REVB_2H)
7520 NODE_NAME_CASE(REVB_2W)
7521 NODE_NAME_CASE(BITREV_4B)
7522 NODE_NAME_CASE(BITREV_8B)
7523 NODE_NAME_CASE(BITREV_W)
7524 NODE_NAME_CASE(ROTR_W)
7525 NODE_NAME_CASE(ROTL_W)
7526 NODE_NAME_CASE(DIV_W)
7527 NODE_NAME_CASE(DIV_WU)
7528 NODE_NAME_CASE(MOD_W)
7529 NODE_NAME_CASE(MOD_WU)
7530 NODE_NAME_CASE(CLZ_W)
7531 NODE_NAME_CASE(CTZ_W)
7532 NODE_NAME_CASE(DBAR)
7533 NODE_NAME_CASE(IBAR)
7534 NODE_NAME_CASE(BREAK)
7535 NODE_NAME_CASE(SYSCALL)
7536 NODE_NAME_CASE(CRC_W_B_W)
7537 NODE_NAME_CASE(CRC_W_H_W)
7538 NODE_NAME_CASE(CRC_W_W_W)
7539 NODE_NAME_CASE(CRC_W_D_W)
7540 NODE_NAME_CASE(CRCC_W_B_W)
7541 NODE_NAME_CASE(CRCC_W_H_W)
7542 NODE_NAME_CASE(CRCC_W_W_W)
7543 NODE_NAME_CASE(CRCC_W_D_W)
7544 NODE_NAME_CASE(CSRRD)
7545 NODE_NAME_CASE(CSRWR)
7546 NODE_NAME_CASE(CSRXCHG)
7547 NODE_NAME_CASE(IOCSRRD_B)
7548 NODE_NAME_CASE(IOCSRRD_H)
7549 NODE_NAME_CASE(IOCSRRD_W)
7550 NODE_NAME_CASE(IOCSRRD_D)
7551 NODE_NAME_CASE(IOCSRWR_B)
7552 NODE_NAME_CASE(IOCSRWR_H)
7553 NODE_NAME_CASE(IOCSRWR_W)
7554 NODE_NAME_CASE(IOCSRWR_D)
7555 NODE_NAME_CASE(CPUCFG)
7556 NODE_NAME_CASE(MOVGR2FCSR)
7557 NODE_NAME_CASE(MOVFCSR2GR)
7558 NODE_NAME_CASE(CACOP_D)
7559 NODE_NAME_CASE(CACOP_W)
7560 NODE_NAME_CASE(VSHUF)
7561 NODE_NAME_CASE(VPICKEV)
7562 NODE_NAME_CASE(VPICKOD)
7563 NODE_NAME_CASE(VPACKEV)
7564 NODE_NAME_CASE(VPACKOD)
7565 NODE_NAME_CASE(VILVL)
7566 NODE_NAME_CASE(VILVH)
7567 NODE_NAME_CASE(VSHUF4I)
7568 NODE_NAME_CASE(VREPLVEI)
7569 NODE_NAME_CASE(VREPLGR2VR)
7570 NODE_NAME_CASE(XVPERMI)
7571 NODE_NAME_CASE(XVPERM)
7572 NODE_NAME_CASE(XVREPLVE0)
7573 NODE_NAME_CASE(XVREPLVE0Q)
7574 NODE_NAME_CASE(XVINSVE0)
7575 NODE_NAME_CASE(VPICK_SEXT_ELT)
7576 NODE_NAME_CASE(VPICK_ZEXT_ELT)
7577 NODE_NAME_CASE(VREPLVE)
7578 NODE_NAME_CASE(VALL_ZERO)
7579 NODE_NAME_CASE(VANY_ZERO)
7580 NODE_NAME_CASE(VALL_NONZERO)
7581 NODE_NAME_CASE(VANY_NONZERO)
7582 NODE_NAME_CASE(FRECIPE)
7583 NODE_NAME_CASE(FRSQRTE)
7584 NODE_NAME_CASE(VSLLI)
7585 NODE_NAME_CASE(VSRLI)
7586 NODE_NAME_CASE(VBSLL)
7587 NODE_NAME_CASE(VBSRL)
7588 NODE_NAME_CASE(VLDREPL)
7589 NODE_NAME_CASE(VMSKLTZ)
7590 NODE_NAME_CASE(VMSKGEZ)
7591 NODE_NAME_CASE(VMSKEQZ)
7592 NODE_NAME_CASE(VMSKNEZ)
7593 NODE_NAME_CASE(XVMSKLTZ)
7594 NODE_NAME_CASE(XVMSKGEZ)
7595 NODE_NAME_CASE(XVMSKEQZ)
7596 NODE_NAME_CASE(XVMSKNEZ)
7597 NODE_NAME_CASE(VHADDW)
7598 }
7599#undef NODE_NAME_CASE
7600 return nullptr;
7601}
7602
7603//===----------------------------------------------------------------------===//
7604// Calling Convention Implementation
7605//===----------------------------------------------------------------------===//
7606
7607 // Eight general-purpose registers a0-a7 are used for passing integer
7608 // arguments, with a0-a1 reused to return values. Generally, the GPRs are used
7609 // to pass fixed-point arguments, and floating-point arguments when no FPR is
7610 // available or when the soft-float ABI is in use.
7611const MCPhysReg ArgGPRs[] = {LoongArch::R4, LoongArch::R5, LoongArch::R6,
7612 LoongArch::R7, LoongArch::R8, LoongArch::R9,
7613 LoongArch::R10, LoongArch::R11};
7614 // Eight floating-point registers fa0-fa7 are used for passing floating-point
7615 // arguments, and fa0-fa1 are also used to return values.
7616const MCPhysReg ArgFPR32s[] = {LoongArch::F0, LoongArch::F1, LoongArch::F2,
7617 LoongArch::F3, LoongArch::F4, LoongArch::F5,
7618 LoongArch::F6, LoongArch::F7};
7619// FPR32 and FPR64 alias each other.
7621 LoongArch::F0_64, LoongArch::F1_64, LoongArch::F2_64, LoongArch::F3_64,
7622 LoongArch::F4_64, LoongArch::F5_64, LoongArch::F6_64, LoongArch::F7_64};
7623
7624const MCPhysReg ArgVRs[] = {LoongArch::VR0, LoongArch::VR1, LoongArch::VR2,
7625 LoongArch::VR3, LoongArch::VR4, LoongArch::VR5,
7626 LoongArch::VR6, LoongArch::VR7};
7627
7628const MCPhysReg ArgXRs[] = {LoongArch::XR0, LoongArch::XR1, LoongArch::XR2,
7629 LoongArch::XR3, LoongArch::XR4, LoongArch::XR5,
7630 LoongArch::XR6, LoongArch::XR7};
7631
7632// Pass a 2*GRLen argument that has been split into two GRLen values through
7633// registers or the stack as necessary.
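// For example, on LA32 (GRLen == 32) an i64 argument is legalised into two i32
// halves; depending on how many of a0-a7 are still free, both halves go in
// registers, the first goes in a register and the second on the stack, or both
// go on the stack, exactly as handled below.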
7634static bool CC_LoongArchAssign2GRLen(unsigned GRLen, CCState &State,
7635 CCValAssign VA1, ISD::ArgFlagsTy ArgFlags1,
7636 unsigned ValNo2, MVT ValVT2, MVT LocVT2,
7637 ISD::ArgFlagsTy ArgFlags2) {
7638 unsigned GRLenInBytes = GRLen / 8;
7639 if (Register Reg = State.AllocateReg(ArgGPRs)) {
7640 // At least one half can be passed via register.
7641 State.addLoc(CCValAssign::getReg(VA1.getValNo(), VA1.getValVT(), Reg,
7642 VA1.getLocVT(), CCValAssign::Full));
7643 } else {
7644 // Both halves must be passed on the stack, with proper alignment.
7645 Align StackAlign =
7646 std::max(Align(GRLenInBytes), ArgFlags1.getNonZeroOrigAlign());
7647 State.addLoc(
7649 State.AllocateStack(GRLenInBytes, StackAlign),
7650 VA1.getLocVT(), CCValAssign::Full));
7651 State.addLoc(CCValAssign::getMem(
7652 ValNo2, ValVT2, State.AllocateStack(GRLenInBytes, Align(GRLenInBytes)),
7653 LocVT2, CCValAssign::Full));
7654 return false;
7655 }
7656 if (Register Reg = State.AllocateReg(ArgGPRs)) {
7657 // The second half can also be passed via register.
7658 State.addLoc(
7659 CCValAssign::getReg(ValNo2, ValVT2, Reg, LocVT2, CCValAssign::Full));
7660 } else {
7661 // The second half is passed via the stack, without additional alignment.
7662 State.addLoc(CCValAssign::getMem(
7663 ValNo2, ValVT2, State.AllocateStack(GRLenInBytes, Align(GRLenInBytes)),
7664 LocVT2, CCValAssign::Full));
7665 }
7666 return false;
7667}
7668
7669// Implements the LoongArch calling convention. Returns true upon failure.
7671 unsigned ValNo, MVT ValVT,
7672 CCValAssign::LocInfo LocInfo, ISD::ArgFlagsTy ArgFlags,
7673 CCState &State, bool IsRet, Type *OrigTy) {
7674 unsigned GRLen = DL.getLargestLegalIntTypeSizeInBits();
7675   assert((GRLen == 32 || GRLen == 64) && "Unsupported GRLen");
7676 MVT GRLenVT = GRLen == 32 ? MVT::i32 : MVT::i64;
7677 MVT LocVT = ValVT;
7678
7679 // Any return value split into more than two values can't be returned
7680 // directly.
7681 if (IsRet && ValNo > 1)
7682 return true;
7683
7684   // Use GPRs for floating-point values with a soft-float ABI, for variadic
       // arguments, or when no FPR is available.
7685 bool UseGPRForFloat = true;
7686
7687 switch (ABI) {
7688 default:
7689 llvm_unreachable("Unexpected ABI");
7690 break;
7695 UseGPRForFloat = ArgFlags.isVarArg();
7696 break;
7699 break;
7700 }
7701
7702 // If this is a variadic argument, the LoongArch calling convention requires
7703 // that it is assigned an 'even' or 'aligned' register if it has (2*GRLen)/8
7704 // byte alignment. An aligned register should be used regardless of whether
7705 // the original argument was split during legalisation or not. The argument
7706 // will not be passed by registers if the original type is larger than
7707 // 2*GRLen, so the register alignment rule does not apply.
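  // As a concrete (illustrative) example on LA64: a variadic __int128 has
  // 16-byte size and 16-byte alignment, so if the next free register were a5
  // (an odd index into a0-a7), a5 is skipped and the two halves are passed in
  // a6/a7 instead.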
7708 unsigned TwoGRLenInBytes = (2 * GRLen) / 8;
7709 if (ArgFlags.isVarArg() &&
7710 ArgFlags.getNonZeroOrigAlign() == TwoGRLenInBytes &&
7711 DL.getTypeAllocSize(OrigTy) == TwoGRLenInBytes) {
7712 unsigned RegIdx = State.getFirstUnallocated(ArgGPRs);
7713 // Skip 'odd' register if necessary.
7714 if (RegIdx != std::size(ArgGPRs) && RegIdx % 2 == 1)
7715 State.AllocateReg(ArgGPRs);
7716 }
7717
7718 SmallVectorImpl<CCValAssign> &PendingLocs = State.getPendingLocs();
7719 SmallVectorImpl<ISD::ArgFlagsTy> &PendingArgFlags =
7720 State.getPendingArgFlags();
7721
7722 assert(PendingLocs.size() == PendingArgFlags.size() &&
7723 "PendingLocs and PendingArgFlags out of sync");
7724
7725 // FPR32 and FPR64 alias each other.
7726 if (State.getFirstUnallocated(ArgFPR32s) == std::size(ArgFPR32s))
7727 UseGPRForFloat = true;
7728
7729 if (UseGPRForFloat && ValVT == MVT::f32) {
7730 LocVT = GRLenVT;
7731 LocInfo = CCValAssign::BCvt;
7732 } else if (UseGPRForFloat && GRLen == 64 && ValVT == MVT::f64) {
7733 LocVT = MVT::i64;
7734 LocInfo = CCValAssign::BCvt;
7735 } else if (UseGPRForFloat && GRLen == 32 && ValVT == MVT::f64) {
7736 // Handle passing f64 on LA32D with a soft float ABI or when floating point
7737 // registers are exhausted.
7738 assert(PendingLocs.empty() && "Can't lower f64 if it is split");
7739     // Depending on the available argument GPRs, f64 may be passed in a pair of
7740 // GPRs, split between a GPR and the stack, or passed completely on the
7741 // stack. LowerCall/LowerFormalArguments/LowerReturn must recognise these
7742 // cases.
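    // Roughly, the three possibilities handled below are: two free GPRs hold
    // both 32-bit halves; one free GPR holds the low half and a 4-byte stack
    // slot holds the high half; or no GPR is free and the whole f64 goes into
    // an 8-byte stack slot.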
7743 MCRegister Reg = State.AllocateReg(ArgGPRs);
7744 if (!Reg) {
7745 int64_t StackOffset = State.AllocateStack(8, Align(8));
7746 State.addLoc(
7747 CCValAssign::getMem(ValNo, ValVT, StackOffset, LocVT, LocInfo));
7748 return false;
7749 }
7750 LocVT = MVT::i32;
7751 State.addLoc(CCValAssign::getCustomReg(ValNo, ValVT, Reg, LocVT, LocInfo));
7752 MCRegister HiReg = State.AllocateReg(ArgGPRs);
7753 if (HiReg) {
7754 State.addLoc(
7755 CCValAssign::getCustomReg(ValNo, ValVT, HiReg, LocVT, LocInfo));
7756 } else {
7757 int64_t StackOffset = State.AllocateStack(4, Align(4));
7758 State.addLoc(
7759 CCValAssign::getCustomMem(ValNo, ValVT, StackOffset, LocVT, LocInfo));
7760 }
7761 return false;
7762 }
7763
7764 // Split arguments might be passed indirectly, so keep track of the pending
7765 // values.
7766 if (ValVT.isScalarInteger() && (ArgFlags.isSplit() || !PendingLocs.empty())) {
7767 LocVT = GRLenVT;
7768 LocInfo = CCValAssign::Indirect;
7769 PendingLocs.push_back(
7770 CCValAssign::getPending(ValNo, ValVT, LocVT, LocInfo));
7771 PendingArgFlags.push_back(ArgFlags);
7772 if (!ArgFlags.isSplitEnd()) {
7773 return false;
7774 }
7775 }
7776
7777 // If the split argument only had two elements, it should be passed directly
7778 // in registers or on the stack.
7779 if (ValVT.isScalarInteger() && ArgFlags.isSplitEnd() &&
7780 PendingLocs.size() <= 2) {
7781 assert(PendingLocs.size() == 2 && "Unexpected PendingLocs.size()");
7782 // Apply the normal calling convention rules to the first half of the
7783 // split argument.
7784 CCValAssign VA = PendingLocs[0];
7785 ISD::ArgFlagsTy AF = PendingArgFlags[0];
7786 PendingLocs.clear();
7787 PendingArgFlags.clear();
7788 return CC_LoongArchAssign2GRLen(GRLen, State, VA, AF, ValNo, ValVT, LocVT,
7789 ArgFlags);
7790 }
7791
7792 // Allocate to a register if possible, or else a stack slot.
7793 Register Reg;
7794 unsigned StoreSizeBytes = GRLen / 8;
7795 Align StackAlign = Align(GRLen / 8);
7796
7797 if (ValVT == MVT::f32 && !UseGPRForFloat) {
7798 Reg = State.AllocateReg(ArgFPR32s);
7799 } else if (ValVT == MVT::f64 && !UseGPRForFloat) {
7800 Reg = State.AllocateReg(ArgFPR64s);
7801 } else if (ValVT.is128BitVector()) {
7802 Reg = State.AllocateReg(ArgVRs);
7803 UseGPRForFloat = false;
7804 StoreSizeBytes = 16;
7805 StackAlign = Align(16);
7806 } else if (ValVT.is256BitVector()) {
7807 Reg = State.AllocateReg(ArgXRs);
7808 UseGPRForFloat = false;
7809 StoreSizeBytes = 32;
7810 StackAlign = Align(32);
7811 } else {
7812 Reg = State.AllocateReg(ArgGPRs);
7813 }
7814
7815 unsigned StackOffset =
7816 Reg ? 0 : State.AllocateStack(StoreSizeBytes, StackAlign);
7817
7818 // If we reach this point and PendingLocs is non-empty, we must be at the
7819 // end of a split argument that must be passed indirectly.
7820 if (!PendingLocs.empty()) {
7821 assert(ArgFlags.isSplitEnd() && "Expected ArgFlags.isSplitEnd()");
7822 assert(PendingLocs.size() > 2 && "Unexpected PendingLocs.size()");
7823 for (auto &It : PendingLocs) {
7824 if (Reg)
7825 It.convertToReg(Reg);
7826 else
7827 It.convertToMem(StackOffset);
7828 State.addLoc(It);
7829 }
7830 PendingLocs.clear();
7831 PendingArgFlags.clear();
7832 return false;
7833 }
7834 assert((!UseGPRForFloat || LocVT == GRLenVT) &&
7835          "Expected a GRLenVT at this stage");
7836
7837 if (Reg) {
7838 State.addLoc(CCValAssign::getReg(ValNo, ValVT, Reg, LocVT, LocInfo));
7839 return false;
7840 }
7841
7842 // When a floating-point value is passed on the stack, no bit-cast is needed.
7843 if (ValVT.isFloatingPoint()) {
7844 LocVT = ValVT;
7845 LocInfo = CCValAssign::Full;
7846 }
7847
7848 State.addLoc(CCValAssign::getMem(ValNo, ValVT, StackOffset, LocVT, LocInfo));
7849 return false;
7850}
7851
7852void LoongArchTargetLowering::analyzeInputArgs(
7853 MachineFunction &MF, CCState &CCInfo,
7854 const SmallVectorImpl<ISD::InputArg> &Ins, bool IsRet,
7855 LoongArchCCAssignFn Fn) const {
7856 FunctionType *FType = MF.getFunction().getFunctionType();
7857 for (unsigned i = 0, e = Ins.size(); i != e; ++i) {
7858 MVT ArgVT = Ins[i].VT;
7859 Type *ArgTy = nullptr;
7860 if (IsRet)
7861 ArgTy = FType->getReturnType();
7862 else if (Ins[i].isOrigArg())
7863 ArgTy = FType->getParamType(Ins[i].getOrigArgIndex());
7865 MF.getSubtarget<LoongArchSubtarget>().getTargetABI();
7866 if (Fn(MF.getDataLayout(), ABI, i, ArgVT, CCValAssign::Full, Ins[i].Flags,
7867 CCInfo, IsRet, ArgTy)) {
7868 LLVM_DEBUG(dbgs() << "InputArg #" << i << " has unhandled type " << ArgVT
7869 << '\n');
7870 llvm_unreachable("");
7871 }
7872 }
7873}
7874
7875void LoongArchTargetLowering::analyzeOutputArgs(
7876 MachineFunction &MF, CCState &CCInfo,
7877 const SmallVectorImpl<ISD::OutputArg> &Outs, bool IsRet,
7878 CallLoweringInfo *CLI, LoongArchCCAssignFn Fn) const {
7879 for (unsigned i = 0, e = Outs.size(); i != e; ++i) {
7880 MVT ArgVT = Outs[i].VT;
7881 Type *OrigTy = CLI ? CLI->getArgs()[Outs[i].OrigArgIndex].Ty : nullptr;
7883 MF.getSubtarget<LoongArchSubtarget>().getTargetABI();
7884 if (Fn(MF.getDataLayout(), ABI, i, ArgVT, CCValAssign::Full, Outs[i].Flags,
7885 CCInfo, IsRet, OrigTy)) {
7886 LLVM_DEBUG(dbgs() << "OutputArg #" << i << " has unhandled type " << ArgVT
7887 << "\n");
7888 llvm_unreachable("");
7889 }
7890 }
7891}
7892
7893// Convert Val to a ValVT. Should not be called for CCValAssign::Indirect
7894// values.
7896 const CCValAssign &VA, const SDLoc &DL) {
7897 switch (VA.getLocInfo()) {
7898 default:
7899 llvm_unreachable("Unexpected CCValAssign::LocInfo");
7900 case CCValAssign::Full:
7902 break;
7903 case CCValAssign::BCvt:
7904 if (VA.getLocVT() == MVT::i64 && VA.getValVT() == MVT::f32)
7905 Val = DAG.getNode(LoongArchISD::MOVGR2FR_W_LA64, DL, MVT::f32, Val);
7906 else
7907 Val = DAG.getNode(ISD::BITCAST, DL, VA.getValVT(), Val);
7908 break;
7909 }
7910 return Val;
7911}
7912
7914 const CCValAssign &VA, const SDLoc &DL,
7915 const ISD::InputArg &In,
7916 const LoongArchTargetLowering &TLI) {
7919 EVT LocVT = VA.getLocVT();
7920 SDValue Val;
7921 const TargetRegisterClass *RC = TLI.getRegClassFor(LocVT.getSimpleVT());
7922 Register VReg = RegInfo.createVirtualRegister(RC);
7923 RegInfo.addLiveIn(VA.getLocReg(), VReg);
7924 Val = DAG.getCopyFromReg(Chain, DL, VReg, LocVT);
7925
7926 // If input is sign extended from 32 bits, note it for the OptW pass.
7927 if (In.isOrigArg()) {
7928 Argument *OrigArg = MF.getFunction().getArg(In.getOrigArgIndex());
7929 if (OrigArg->getType()->isIntegerTy()) {
7930 unsigned BitWidth = OrigArg->getType()->getIntegerBitWidth();
7931 // An input zero extended from i31 can also be considered sign extended.
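      // (If the value was zero-extended from fewer than 32 bits, bit 31 is
      // known to be zero, so it is also a correctly sign-extended 32-bit
      // value.)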
7932 if ((BitWidth <= 32 && In.Flags.isSExt()) ||
7933 (BitWidth < 32 && In.Flags.isZExt())) {
7936 LAFI->addSExt32Register(VReg);
7937 }
7938 }
7939 }
7940
7941 return convertLocVTToValVT(DAG, Val, VA, DL);
7942}
7943
7944// The caller is responsible for loading the full value if the argument is
7945// passed with CCValAssign::Indirect.
7947 const CCValAssign &VA, const SDLoc &DL) {
7949 MachineFrameInfo &MFI = MF.getFrameInfo();
7950 EVT ValVT = VA.getValVT();
7951 int FI = MFI.CreateFixedObject(ValVT.getStoreSize(), VA.getLocMemOffset(),
7952 /*IsImmutable=*/true);
7953 SDValue FIN = DAG.getFrameIndex(
7955
7956 ISD::LoadExtType ExtType;
7957 switch (VA.getLocInfo()) {
7958 default:
7959 llvm_unreachable("Unexpected CCValAssign::LocInfo");
7960 case CCValAssign::Full:
7962 case CCValAssign::BCvt:
7963 ExtType = ISD::NON_EXTLOAD;
7964 break;
7965 }
7966 return DAG.getExtLoad(
7967 ExtType, DL, VA.getLocVT(), Chain, FIN,
7969}
7970
7972 const CCValAssign &VA,
7973 const CCValAssign &HiVA,
7974 const SDLoc &DL) {
7975 assert(VA.getLocVT() == MVT::i32 && VA.getValVT() == MVT::f64 &&
7976 "Unexpected VA");
7978 MachineFrameInfo &MFI = MF.getFrameInfo();
7980
7981 assert(VA.isRegLoc() && "Expected register VA assignment");
7982
7983 Register LoVReg = RegInfo.createVirtualRegister(&LoongArch::GPRRegClass);
7984 RegInfo.addLiveIn(VA.getLocReg(), LoVReg);
7985 SDValue Lo = DAG.getCopyFromReg(Chain, DL, LoVReg, MVT::i32);
7986 SDValue Hi;
7987 if (HiVA.isMemLoc()) {
7988 // Second half of f64 is passed on the stack.
7989 int FI = MFI.CreateFixedObject(4, HiVA.getLocMemOffset(),
7990 /*IsImmutable=*/true);
7991 SDValue FIN = DAG.getFrameIndex(FI, MVT::i32);
7992 Hi = DAG.getLoad(MVT::i32, DL, Chain, FIN,
7994 } else {
7995 // Second half of f64 is passed in another GPR.
7996 Register HiVReg = RegInfo.createVirtualRegister(&LoongArch::GPRRegClass);
7997 RegInfo.addLiveIn(HiVA.getLocReg(), HiVReg);
7998 Hi = DAG.getCopyFromReg(Chain, DL, HiVReg, MVT::i32);
7999 }
8000 return DAG.getNode(LoongArchISD::BUILD_PAIR_F64, DL, MVT::f64, Lo, Hi);
8001}
8002
8004 const CCValAssign &VA, const SDLoc &DL) {
8005 EVT LocVT = VA.getLocVT();
8006
8007 switch (VA.getLocInfo()) {
8008 default:
8009 llvm_unreachable("Unexpected CCValAssign::LocInfo");
8010 case CCValAssign::Full:
8011 break;
8012 case CCValAssign::BCvt:
8013 if (VA.getLocVT() == MVT::i64 && VA.getValVT() == MVT::f32)
8014 Val = DAG.getNode(LoongArchISD::MOVFR2GR_S_LA64, DL, MVT::i64, Val);
8015 else
8016 Val = DAG.getNode(ISD::BITCAST, DL, LocVT, Val);
8017 break;
8018 }
8019 return Val;
8020}
8021
8022static bool CC_LoongArch_GHC(unsigned ValNo, MVT ValVT, MVT LocVT,
8023 CCValAssign::LocInfo LocInfo,
8024 ISD::ArgFlagsTy ArgFlags, Type *OrigTy,
8025 CCState &State) {
8026 if (LocVT == MVT::i32 || LocVT == MVT::i64) {
8027 // Pass in STG registers: Base, Sp, Hp, R1, R2, R3, R4, R5, SpLim
8028 // s0 s1 s2 s3 s4 s5 s6 s7 s8
8029 static const MCPhysReg GPRList[] = {
8030 LoongArch::R23, LoongArch::R24, LoongArch::R25,
8031 LoongArch::R26, LoongArch::R27, LoongArch::R28,
8032 LoongArch::R29, LoongArch::R30, LoongArch::R31};
8033 if (MCRegister Reg = State.AllocateReg(GPRList)) {
8034 State.addLoc(CCValAssign::getReg(ValNo, ValVT, Reg, LocVT, LocInfo));
8035 return false;
8036 }
8037 }
8038
8039 if (LocVT == MVT::f32) {
8040 // Pass in STG registers: F1, F2, F3, F4
8041 // fs0,fs1,fs2,fs3
8042 static const MCPhysReg FPR32List[] = {LoongArch::F24, LoongArch::F25,
8043 LoongArch::F26, LoongArch::F27};
8044 if (MCRegister Reg = State.AllocateReg(FPR32List)) {
8045 State.addLoc(CCValAssign::getReg(ValNo, ValVT, Reg, LocVT, LocInfo));
8046 return false;
8047 }
8048 }
8049
8050 if (LocVT == MVT::f64) {
8051 // Pass in STG registers: D1, D2, D3, D4
8052 // fs4,fs5,fs6,fs7
8053 static const MCPhysReg FPR64List[] = {LoongArch::F28_64, LoongArch::F29_64,
8054 LoongArch::F30_64, LoongArch::F31_64};
8055 if (MCRegister Reg = State.AllocateReg(FPR64List)) {
8056 State.addLoc(CCValAssign::getReg(ValNo, ValVT, Reg, LocVT, LocInfo));
8057 return false;
8058 }
8059 }
8060
8061 report_fatal_error("No registers left in GHC calling convention");
8062 return true;
8063}
8064
8065// Transform physical registers into virtual registers.
8067 SDValue Chain, CallingConv::ID CallConv, bool IsVarArg,
8068 const SmallVectorImpl<ISD::InputArg> &Ins, const SDLoc &DL,
8069 SelectionDAG &DAG, SmallVectorImpl<SDValue> &InVals) const {
8070
8072
8073 switch (CallConv) {
8074 default:
8075 llvm_unreachable("Unsupported calling convention");
8076 case CallingConv::C:
8077 case CallingConv::Fast:
8079 break;
8080 case CallingConv::GHC:
8081 if (!MF.getSubtarget().hasFeature(LoongArch::FeatureBasicF) ||
8082 !MF.getSubtarget().hasFeature(LoongArch::FeatureBasicD))
8084 "GHC calling convention requires the F and D extensions");
8085 }
8086
8087 EVT PtrVT = getPointerTy(DAG.getDataLayout());
8088 MVT GRLenVT = Subtarget.getGRLenVT();
8089 unsigned GRLenInBytes = Subtarget.getGRLen() / 8;
8090   // Used with varargs to accumulate store chains.
8091 std::vector<SDValue> OutChains;
8092
8093 // Assign locations to all of the incoming arguments.
8095 CCState CCInfo(CallConv, IsVarArg, MF, ArgLocs, *DAG.getContext());
8096
8097 if (CallConv == CallingConv::GHC)
8099 else
8100 analyzeInputArgs(MF, CCInfo, Ins, /*IsRet=*/false, CC_LoongArch);
8101
8102 for (unsigned i = 0, e = ArgLocs.size(), InsIdx = 0; i != e; ++i, ++InsIdx) {
8103 CCValAssign &VA = ArgLocs[i];
8104 SDValue ArgValue;
8105 // Passing f64 on LA32D with a soft float ABI must be handled as a special
8106 // case.
8107 if (VA.getLocVT() == MVT::i32 && VA.getValVT() == MVT::f64) {
8108 assert(VA.needsCustom());
8109 ArgValue = unpackF64OnLA32DSoftABI(DAG, Chain, VA, ArgLocs[++i], DL);
8110 } else if (VA.isRegLoc())
8111 ArgValue = unpackFromRegLoc(DAG, Chain, VA, DL, Ins[InsIdx], *this);
8112 else
8113 ArgValue = unpackFromMemLoc(DAG, Chain, VA, DL);
8114 if (VA.getLocInfo() == CCValAssign::Indirect) {
8115 // If the original argument was split and passed by reference, we need to
8116 // load all parts of it here (using the same address).
8117 InVals.push_back(DAG.getLoad(VA.getValVT(), DL, Chain, ArgValue,
8119 unsigned ArgIndex = Ins[InsIdx].OrigArgIndex;
8120 unsigned ArgPartOffset = Ins[InsIdx].PartOffset;
8121 assert(ArgPartOffset == 0);
8122 while (i + 1 != e && Ins[InsIdx + 1].OrigArgIndex == ArgIndex) {
8123 CCValAssign &PartVA = ArgLocs[i + 1];
8124 unsigned PartOffset = Ins[InsIdx + 1].PartOffset - ArgPartOffset;
8125 SDValue Offset = DAG.getIntPtrConstant(PartOffset, DL);
8126 SDValue Address = DAG.getNode(ISD::ADD, DL, PtrVT, ArgValue, Offset);
8127 InVals.push_back(DAG.getLoad(PartVA.getValVT(), DL, Chain, Address,
8129 ++i;
8130 ++InsIdx;
8131 }
8132 continue;
8133 }
8134 InVals.push_back(ArgValue);
8135 }
8136
8137 if (IsVarArg) {
8139 unsigned Idx = CCInfo.getFirstUnallocated(ArgRegs);
8140 const TargetRegisterClass *RC = &LoongArch::GPRRegClass;
8141 MachineFrameInfo &MFI = MF.getFrameInfo();
8142 MachineRegisterInfo &RegInfo = MF.getRegInfo();
8143 auto *LoongArchFI = MF.getInfo<LoongArchMachineFunctionInfo>();
8144
8145 // Offset of the first variable argument from stack pointer, and size of
8146 // the vararg save area. For now, the varargs save area is either zero or
8147 // large enough to hold a0-a7.
8148 int VaArgOffset, VarArgsSaveSize;
8149
8150 // If all registers are allocated, then all varargs must be passed on the
8151 // stack and we don't need to save any argregs.
8152 if (ArgRegs.size() == Idx) {
8153 VaArgOffset = CCInfo.getStackSize();
8154 VarArgsSaveSize = 0;
8155 } else {
8156 VarArgsSaveSize = GRLenInBytes * (ArgRegs.size() - Idx);
8157 VaArgOffset = -VarArgsSaveSize;
8158 }
8159
8160 // Record the frame index of the first variable argument,
8161 // which is needed by VASTART.
8162 int FI = MFI.CreateFixedObject(GRLenInBytes, VaArgOffset, true);
8163 LoongArchFI->setVarArgsFrameIndex(FI);
8164
8165 // If saving an odd number of registers, create an extra stack slot to
8166 // ensure that the frame pointer is 2*GRLen-aligned, which in turn ensures
8167 // offsets to even-numbered registers remain 2*GRLen-aligned.
8168 if (Idx % 2) {
8169 MFI.CreateFixedObject(GRLenInBytes, VaArgOffset - (int)GRLenInBytes,
8170 true);
8171 VarArgsSaveSize += GRLenInBytes;
8172 }
8173
8174 // Copy the integer registers that may have been used for passing varargs
8175 // to the vararg save area.
8176 for (unsigned I = Idx; I < ArgRegs.size();
8177 ++I, VaArgOffset += GRLenInBytes) {
8178 const Register Reg = RegInfo.createVirtualRegister(RC);
8179 RegInfo.addLiveIn(ArgRegs[I], Reg);
8180 SDValue ArgValue = DAG.getCopyFromReg(Chain, DL, Reg, GRLenVT);
8181 FI = MFI.CreateFixedObject(GRLenInBytes, VaArgOffset, true);
8182 SDValue PtrOff = DAG.getFrameIndex(FI, getPointerTy(DAG.getDataLayout()));
8183 SDValue Store = DAG.getStore(Chain, DL, ArgValue, PtrOff,
8185 cast<StoreSDNode>(Store.getNode())
8186 ->getMemOperand()
8187 ->setValue((Value *)nullptr);
8188 OutChains.push_back(Store);
8189 }
8190 LoongArchFI->setVarArgsSaveSize(VarArgsSaveSize);
8191 }
8192
8193 // All stores are grouped in one node to allow the matching between
8194 // the size of Ins and InVals. This only happens for vararg functions.
8195 if (!OutChains.empty()) {
8196 OutChains.push_back(Chain);
8197 Chain = DAG.getNode(ISD::TokenFactor, DL, MVT::Other, OutChains);
8198 }
8199
8200 return Chain;
8201}
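To make the vararg save-area arithmetic above concrete, here is a standalone sketch of the same sizing computation (the helper name and signature are made up for illustration and are not part of this file). With three named GPR arguments on LA64, a3-a7 are spilled (40 bytes) plus one 8-byte padding slot so the area stays 2*GRLen aligned.

// Illustrative sketch only: mirrors the sizing logic in the IsVarArg block above,
// assuming the eight GPR argument registers a0-a7 and FirstUnusedArgGPR < 8.
static void exampleVarArgSaveArea(unsigned FirstUnusedArgGPR, unsigned GRLenInBytes,
                                  int &VaArgOffset, int &VarArgsSaveSize) {
  const unsigned NumArgGPRs = 8;
  VarArgsSaveSize = GRLenInBytes * (NumArgGPRs - FirstUnusedArgGPR);
  VaArgOffset = -VarArgsSaveSize;    // e.g. 3 named args on LA64: 40 bytes at offset -40
  if (FirstUnusedArgGPR % 2)         // odd index: add a pad slot for 2*GRLen alignment
    VarArgsSaveSize += GRLenInBytes; // ... 48 bytes total in that example
}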
8202
8204 return CI->isTailCall();
8205}
8206
8207 // Check that the return value is used only as a return value, as otherwise
8208 // we can't perform a tail call.
8210 SDValue &Chain) const {
8211 if (N->getNumValues() != 1)
8212 return false;
8213 if (!N->hasNUsesOfValue(1, 0))
8214 return false;
8215
8216 SDNode *Copy = *N->user_begin();
8217 if (Copy->getOpcode() != ISD::CopyToReg)
8218 return false;
8219
8220 // If the ISD::CopyToReg has a glue operand, we conservatively assume it
8221 // isn't safe to perform a tail call.
8222 if (Copy->getGluedNode())
8223 return false;
8224
8225 // The copy must be used by a LoongArchISD::RET, and nothing else.
8226 bool HasRet = false;
8227 for (SDNode *Node : Copy->users()) {
8228 if (Node->getOpcode() != LoongArchISD::RET)
8229 return false;
8230 HasRet = true;
8231 }
8232
8233 if (!HasRet)
8234 return false;
8235
8236 Chain = Copy->getOperand(0);
8237 return true;
8238}
8239
8240// Check whether the call is eligible for tail call optimization.
8241bool LoongArchTargetLowering::isEligibleForTailCallOptimization(
8242 CCState &CCInfo, CallLoweringInfo &CLI, MachineFunction &MF,
8243 const SmallVectorImpl<CCValAssign> &ArgLocs) const {
8244
8245 auto CalleeCC = CLI.CallConv;
8246 auto &Outs = CLI.Outs;
8247 auto &Caller = MF.getFunction();
8248 auto CallerCC = Caller.getCallingConv();
8249
8250 // Do not tail call opt if the stack is used to pass parameters.
8251 if (CCInfo.getStackSize() != 0)
8252 return false;
8253
8254 // Do not tail call opt if any parameters need to be passed indirectly.
8255 for (auto &VA : ArgLocs)
8256 if (VA.getLocInfo() == CCValAssign::Indirect)
8257 return false;
8258
8259 // Do not tail call opt if either caller or callee uses struct return
8260 // semantics.
8261 auto IsCallerStructRet = Caller.hasStructRetAttr();
8262 auto IsCalleeStructRet = Outs.empty() ? false : Outs[0].Flags.isSRet();
8263 if (IsCallerStructRet || IsCalleeStructRet)
8264 return false;
8265
8266 // Do not tail call opt if either the callee or caller has a byval argument.
8267 for (auto &Arg : Outs)
8268 if (Arg.Flags.isByVal())
8269 return false;
8270
8271 // The callee has to preserve all registers the caller needs to preserve.
8272 const LoongArchRegisterInfo *TRI = Subtarget.getRegisterInfo();
8273 const uint32_t *CallerPreserved = TRI->getCallPreservedMask(MF, CallerCC);
8274 if (CalleeCC != CallerCC) {
8275 const uint32_t *CalleePreserved = TRI->getCallPreservedMask(MF, CalleeCC);
8276 if (!TRI->regmaskSubsetEqual(CallerPreserved, CalleePreserved))
8277 return false;
8278 }
8279 return true;
8280}
8281
8283 return DAG.getDataLayout().getPrefTypeAlign(
8284 VT.getTypeForEVT(*DAG.getContext()));
8285}
8286
8287// Lower a call to a callseq_start + CALL + callseq_end chain, and add input
8288// and output parameter nodes.
8289SDValue
8291 SmallVectorImpl<SDValue> &InVals) const {
8292 SelectionDAG &DAG = CLI.DAG;
8293 SDLoc &DL = CLI.DL;
8295 SmallVectorImpl<SDValue> &OutVals = CLI.OutVals;
8297 SDValue Chain = CLI.Chain;
8298 SDValue Callee = CLI.Callee;
8299 CallingConv::ID CallConv = CLI.CallConv;
8300 bool IsVarArg = CLI.IsVarArg;
8301 EVT PtrVT = getPointerTy(DAG.getDataLayout());
8302 MVT GRLenVT = Subtarget.getGRLenVT();
8303 bool &IsTailCall = CLI.IsTailCall;
8304
8306
8307 // Analyze the operands of the call, assigning locations to each operand.
8309 CCState ArgCCInfo(CallConv, IsVarArg, MF, ArgLocs, *DAG.getContext());
8310
8311 if (CallConv == CallingConv::GHC)
8312 ArgCCInfo.AnalyzeCallOperands(Outs, CC_LoongArch_GHC);
8313 else
8314 analyzeOutputArgs(MF, ArgCCInfo, Outs, /*IsRet=*/false, &CLI, CC_LoongArch);
8315
8316 // Check if it's really possible to do a tail call.
8317 if (IsTailCall)
8318 IsTailCall = isEligibleForTailCallOptimization(ArgCCInfo, CLI, MF, ArgLocs);
8319
8320 if (IsTailCall)
8321 ++NumTailCalls;
8322 else if (CLI.CB && CLI.CB->isMustTailCall())
8323 report_fatal_error("failed to perform tail call elimination on a call "
8324 "site marked musttail");
8325
8326 // Get a count of how many bytes are to be pushed on the stack.
8327 unsigned NumBytes = ArgCCInfo.getStackSize();
8328
8329 // Create local copies for byval args.
8330 SmallVector<SDValue> ByValArgs;
8331 for (unsigned i = 0, e = Outs.size(); i != e; ++i) {
8332 ISD::ArgFlagsTy Flags = Outs[i].Flags;
8333 if (!Flags.isByVal())
8334 continue;
8335
8336 SDValue Arg = OutVals[i];
8337 unsigned Size = Flags.getByValSize();
8338 Align Alignment = Flags.getNonZeroByValAlign();
8339
8340 int FI =
8341 MF.getFrameInfo().CreateStackObject(Size, Alignment, /*isSS=*/false);
8342 SDValue FIPtr = DAG.getFrameIndex(FI, getPointerTy(DAG.getDataLayout()));
8343 SDValue SizeNode = DAG.getConstant(Size, DL, GRLenVT);
8344
8345 Chain = DAG.getMemcpy(Chain, DL, FIPtr, Arg, SizeNode, Alignment,
8346 /*IsVolatile=*/false,
8347 /*AlwaysInline=*/false, /*CI=*/nullptr, std::nullopt,
8349 ByValArgs.push_back(FIPtr);
8350 }
8351
8352 if (!IsTailCall)
8353 Chain = DAG.getCALLSEQ_START(Chain, NumBytes, 0, CLI.DL);
8354
8355 // Copy argument values to their designated locations.
8357 SmallVector<SDValue> MemOpChains;
8358 SDValue StackPtr;
8359 for (unsigned i = 0, j = 0, e = ArgLocs.size(), OutIdx = 0; i != e;
8360 ++i, ++OutIdx) {
8361 CCValAssign &VA = ArgLocs[i];
8362 SDValue ArgValue = OutVals[OutIdx];
8363 ISD::ArgFlagsTy Flags = Outs[OutIdx].Flags;
8364
8365 // Handle passing f64 on LA32D with a soft float ABI as a special case.
8366 if (VA.getLocVT() == MVT::i32 && VA.getValVT() == MVT::f64) {
8367 assert(VA.isRegLoc() && "Expected register VA assignment");
8368 assert(VA.needsCustom());
8369 SDValue SplitF64 =
8371 DAG.getVTList(MVT::i32, MVT::i32), ArgValue);
8372 SDValue Lo = SplitF64.getValue(0);
8373 SDValue Hi = SplitF64.getValue(1);
8374
8375 Register RegLo = VA.getLocReg();
8376 RegsToPass.push_back(std::make_pair(RegLo, Lo));
8377
8378 // Get the CCValAssign for the Hi part.
8379 CCValAssign &HiVA = ArgLocs[++i];
8380
8381 if (HiVA.isMemLoc()) {
8382 // Second half of f64 is passed on the stack.
8383 if (!StackPtr.getNode())
8384 StackPtr = DAG.getCopyFromReg(Chain, DL, LoongArch::R3, PtrVT);
8386 DAG.getNode(ISD::ADD, DL, PtrVT, StackPtr,
8387 DAG.getIntPtrConstant(HiVA.getLocMemOffset(), DL));
8388 // Emit the store.
8389 MemOpChains.push_back(DAG.getStore(
8390 Chain, DL, Hi, Address,
8392 } else {
8393 // Second half of f64 is passed in another GPR.
8394 Register RegHigh = HiVA.getLocReg();
8395 RegsToPass.push_back(std::make_pair(RegHigh, Hi));
8396 }
8397 continue;
8398 }
8399
8400 // Promote the value if needed.
8401 // For now, only handle fully promoted and indirect arguments.
8402 if (VA.getLocInfo() == CCValAssign::Indirect) {
8403 // Store the argument in a stack slot and pass its address.
8404 Align StackAlign =
8405 std::max(getPrefTypeAlign(Outs[OutIdx].ArgVT, DAG),
8406 getPrefTypeAlign(ArgValue.getValueType(), DAG));
8407 TypeSize StoredSize = ArgValue.getValueType().getStoreSize();
8408 // If the original argument was split and passed by reference, we need to
8409 // store the required parts of it here (and pass just one address).
8410 unsigned ArgIndex = Outs[OutIdx].OrigArgIndex;
8411 unsigned ArgPartOffset = Outs[OutIdx].PartOffset;
8412 assert(ArgPartOffset == 0);
8413 // Calculate the total size to store. We don't have access to what we're
8414 // actually storing other than performing the loop and collecting the
8415 // info.
8417 while (i + 1 != e && Outs[OutIdx + 1].OrigArgIndex == ArgIndex) {
8418 SDValue PartValue = OutVals[OutIdx + 1];
8419 unsigned PartOffset = Outs[OutIdx + 1].PartOffset - ArgPartOffset;
8420 SDValue Offset = DAG.getIntPtrConstant(PartOffset, DL);
8421 EVT PartVT = PartValue.getValueType();
8422
8423 StoredSize += PartVT.getStoreSize();
8424 StackAlign = std::max(StackAlign, getPrefTypeAlign(PartVT, DAG));
8425 Parts.push_back(std::make_pair(PartValue, Offset));
8426 ++i;
8427 ++OutIdx;
8428 }
8429 SDValue SpillSlot = DAG.CreateStackTemporary(StoredSize, StackAlign);
8430 int FI = cast<FrameIndexSDNode>(SpillSlot)->getIndex();
8431 MemOpChains.push_back(
8432 DAG.getStore(Chain, DL, ArgValue, SpillSlot,
8434 for (const auto &Part : Parts) {
8435 SDValue PartValue = Part.first;
8436 SDValue PartOffset = Part.second;
8438 DAG.getNode(ISD::ADD, DL, PtrVT, SpillSlot, PartOffset);
8439 MemOpChains.push_back(
8440 DAG.getStore(Chain, DL, PartValue, Address,
8442 }
8443 ArgValue = SpillSlot;
8444 } else {
8445 ArgValue = convertValVTToLocVT(DAG, ArgValue, VA, DL);
8446 }
8447
8448 // Use local copy if it is a byval arg.
8449 if (Flags.isByVal())
8450 ArgValue = ByValArgs[j++];
8451
8452 if (VA.isRegLoc()) {
8453 // Queue up the argument copies and emit them at the end.
8454 RegsToPass.push_back(std::make_pair(VA.getLocReg(), ArgValue));
8455 } else {
8456 assert(VA.isMemLoc() && "Argument not register or memory");
8457 assert(!IsTailCall && "Tail call not allowed if stack is used "
8458 "for passing parameters");
8459
8460 // Work out the address of the stack slot.
8461 if (!StackPtr.getNode())
8462 StackPtr = DAG.getCopyFromReg(Chain, DL, LoongArch::R3, PtrVT);
8464 DAG.getNode(ISD::ADD, DL, PtrVT, StackPtr,
8466
8467 // Emit the store.
8468 MemOpChains.push_back(
8469 DAG.getStore(Chain, DL, ArgValue, Address, MachinePointerInfo()));
8470 }
8471 }
8472
8473 // Join the stores, which are independent of one another.
8474 if (!MemOpChains.empty())
8475 Chain = DAG.getNode(ISD::TokenFactor, DL, MVT::Other, MemOpChains);
8476
8477 SDValue Glue;
8478
8479 // Build a sequence of copy-to-reg nodes, chained and glued together.
8480 for (auto &Reg : RegsToPass) {
8481 Chain = DAG.getCopyToReg(Chain, DL, Reg.first, Reg.second, Glue);
8482 Glue = Chain.getValue(1);
8483 }
8484
8485 // If the callee is a GlobalAddress/ExternalSymbol node, turn it into a
8486 // TargetGlobalAddress/TargetExternalSymbol node so that legalize won't
8487 // split it and then direct call can be matched by PseudoCALL.
8489 const GlobalValue *GV = S->getGlobal();
8490 unsigned OpFlags = getTargetMachine().shouldAssumeDSOLocal(GV)
8493 Callee = DAG.getTargetGlobalAddress(S->getGlobal(), DL, PtrVT, 0, OpFlags);
8494 } else if (ExternalSymbolSDNode *S = dyn_cast<ExternalSymbolSDNode>(Callee)) {
8495 unsigned OpFlags = getTargetMachine().shouldAssumeDSOLocal(nullptr)
8498 Callee = DAG.getTargetExternalSymbol(S->getSymbol(), PtrVT, OpFlags);
8499 }
8500
8501 // The first call operand is the chain and the second is the target address.
8503 Ops.push_back(Chain);
8504 Ops.push_back(Callee);
8505
8506 // Add argument registers to the end of the list so that they are
8507 // known live into the call.
8508 for (auto &Reg : RegsToPass)
8509 Ops.push_back(DAG.getRegister(Reg.first, Reg.second.getValueType()));
8510
8511 if (!IsTailCall) {
8512 // Add a register mask operand representing the call-preserved registers.
8513 const TargetRegisterInfo *TRI = Subtarget.getRegisterInfo();
8514 const uint32_t *Mask = TRI->getCallPreservedMask(MF, CallConv);
8515 assert(Mask && "Missing call preserved mask for calling convention");
8516 Ops.push_back(DAG.getRegisterMask(Mask));
8517 }
8518
8519 // Glue the call to the argument copies, if any.
8520 if (Glue.getNode())
8521 Ops.push_back(Glue);
8522
8523 // Emit the call.
8524 SDVTList NodeTys = DAG.getVTList(MVT::Other, MVT::Glue);
8525 unsigned Op;
8526 switch (DAG.getTarget().getCodeModel()) {
8527 default:
8528 report_fatal_error("Unsupported code model");
8529 case CodeModel::Small:
8530 Op = IsTailCall ? LoongArchISD::TAIL : LoongArchISD::CALL;
8531 break;
8532 case CodeModel::Medium:
8533 assert(Subtarget.is64Bit() && "Medium code model requires LA64");
8535 break;
8536 case CodeModel::Large:
8537 assert(Subtarget.is64Bit() && "Large code model requires LA64");
8539 break;
8540 }
8541
8542 if (IsTailCall) {
8544 SDValue Ret = DAG.getNode(Op, DL, NodeTys, Ops);
8545 DAG.addNoMergeSiteInfo(Ret.getNode(), CLI.NoMerge);
8546 return Ret;
8547 }
8548
8549 Chain = DAG.getNode(Op, DL, NodeTys, Ops);
8550 DAG.addNoMergeSiteInfo(Chain.getNode(), CLI.NoMerge);
8551 Glue = Chain.getValue(1);
8552
8553 // Mark the end of the call, which is glued to the call itself.
8554 Chain = DAG.getCALLSEQ_END(Chain, NumBytes, 0, Glue, DL);
8555 Glue = Chain.getValue(1);
8556
8557 // Assign locations to each value returned by this call.
8559 CCState RetCCInfo(CallConv, IsVarArg, MF, RVLocs, *DAG.getContext());
8560 analyzeInputArgs(MF, RetCCInfo, Ins, /*IsRet=*/true, CC_LoongArch);
8561
8562 // Copy all of the result registers out of their specified physreg.
8563 for (unsigned i = 0, e = RVLocs.size(); i != e; ++i) {
8564 auto &VA = RVLocs[i];
8565 // Copy the value out.
8566 SDValue RetValue =
8567 DAG.getCopyFromReg(Chain, DL, VA.getLocReg(), VA.getLocVT(), Glue);
8568 // Glue the RetValue to the end of the call sequence.
8569 Chain = RetValue.getValue(1);
8570 Glue = RetValue.getValue(2);
8571
8572 if (VA.getLocVT() == MVT::i32 && VA.getValVT() == MVT::f64) {
8573 assert(VA.needsCustom());
8574 SDValue RetValue2 = DAG.getCopyFromReg(Chain, DL, RVLocs[++i].getLocReg(),
8575 MVT::i32, Glue);
8576 Chain = RetValue2.getValue(1);
8577 Glue = RetValue2.getValue(2);
8578 RetValue = DAG.getNode(LoongArchISD::BUILD_PAIR_F64, DL, MVT::f64,
8579 RetValue, RetValue2);
8580 } else
8581 RetValue = convertLocVTToValVT(DAG, RetValue, VA, DL);
8582
8583 InVals.push_back(RetValue);
8584 }
8585
8586 return Chain;
8587}
8588
8590 CallingConv::ID CallConv, MachineFunction &MF, bool IsVarArg,
8591 const SmallVectorImpl<ISD::OutputArg> &Outs, LLVMContext &Context,
8592 const Type *RetTy) const {
8594 CCState CCInfo(CallConv, IsVarArg, MF, RVLocs, Context);
8595
8596 for (unsigned i = 0, e = Outs.size(); i != e; ++i) {
8597 LoongArchABI::ABI ABI =
8598 MF.getSubtarget<LoongArchSubtarget>().getTargetABI();
8599 if (CC_LoongArch(MF.getDataLayout(), ABI, i, Outs[i].VT, CCValAssign::Full,
8600 Outs[i].Flags, CCInfo, /*IsRet=*/true, nullptr))
8601 return false;
8602 }
8603 return true;
8604}
8605
8607 SDValue Chain, CallingConv::ID CallConv, bool IsVarArg,
8609 const SmallVectorImpl<SDValue> &OutVals, const SDLoc &DL,
8610 SelectionDAG &DAG) const {
8611 // Stores the assignment of the return value to a location.
8613
8614 // Info about the registers and stack slot.
8615 CCState CCInfo(CallConv, IsVarArg, DAG.getMachineFunction(), RVLocs,
8616 *DAG.getContext());
8617
8618 analyzeOutputArgs(DAG.getMachineFunction(), CCInfo, Outs, /*IsRet=*/true,
8619 nullptr, CC_LoongArch);
8620 if (CallConv == CallingConv::GHC && !RVLocs.empty())
8621 report_fatal_error("GHC functions return void only");
8622 SDValue Glue;
8623 SmallVector<SDValue, 4> RetOps(1, Chain);
8624
8625 // Copy the result values into the output registers.
8626 for (unsigned i = 0, e = RVLocs.size(), OutIdx = 0; i < e; ++i, ++OutIdx) {
8627 SDValue Val = OutVals[OutIdx];
8628 CCValAssign &VA = RVLocs[i];
8629 assert(VA.isRegLoc() && "Can only return in registers!");
8630
8631 if (VA.getLocVT() == MVT::i32 && VA.getValVT() == MVT::f64) {
8632 // Handle returning f64 on LA32D with a soft float ABI.
8633 assert(VA.isRegLoc() && "Expected return via registers");
8634 assert(VA.needsCustom());
8636 DAG.getVTList(MVT::i32, MVT::i32), Val);
8637 SDValue Lo = SplitF64.getValue(0);
8638 SDValue Hi = SplitF64.getValue(1);
8639 Register RegLo = VA.getLocReg();
8640 Register RegHi = RVLocs[++i].getLocReg();
8641
8642 Chain = DAG.getCopyToReg(Chain, DL, RegLo, Lo, Glue);
8643 Glue = Chain.getValue(1);
8644 RetOps.push_back(DAG.getRegister(RegLo, MVT::i32));
8645 Chain = DAG.getCopyToReg(Chain, DL, RegHi, Hi, Glue);
8646 Glue = Chain.getValue(1);
8647 RetOps.push_back(DAG.getRegister(RegHi, MVT::i32));
8648 } else {
8649 // Handle a 'normal' return.
8650 Val = convertValVTToLocVT(DAG, Val, VA, DL);
8651 Chain = DAG.getCopyToReg(Chain, DL, VA.getLocReg(), Val, Glue);
8652
8653 // Guarantee that all emitted copies are stuck together.
8654 Glue = Chain.getValue(1);
8655 RetOps.push_back(DAG.getRegister(VA.getLocReg(), VA.getLocVT()));
8656 }
8657 }
8658
8659 RetOps[0] = Chain; // Update chain.
8660
8661 // Add the glue node if we have it.
8662 if (Glue.getNode())
8663 RetOps.push_back(Glue);
8664
8665 return DAG.getNode(LoongArchISD::RET, DL, MVT::Other, RetOps);
8666}
8667
8668// Check if a constant splat can be generated using [x]vldi, where imm[12] == 1.
8669// Note: The following prefixes are excluded:
8670// imm[11:8] == 4'b0000, 4'b0100, 4'b1000
8671// as they can be represented using [x]vrepli.[whb]
8673 const APInt &SplatValue, const unsigned SplatBitSize) const {
8674 uint64_t RequiredImm = 0;
8675 uint64_t V = SplatValue.getZExtValue();
8676 if (SplatBitSize == 16 && !(V & 0x00FF)) {
8677 // 4'b0101
8678 RequiredImm = (0b10101 << 8) | (V >> 8);
8679 return {true, RequiredImm};
8680 } else if (SplatBitSize == 32) {
8681 // 4'b0001
8682 if (!(V & 0xFFFF00FF)) {
8683 RequiredImm = (0b10001 << 8) | (V >> 8);
8684 return {true, RequiredImm};
8685 }
8686 // 4'b0010
8687 if (!(V & 0xFF00FFFF)) {
8688 RequiredImm = (0b10010 << 8) | (V >> 16);
8689 return {true, RequiredImm};
8690 }
8691 // 4'b0011
8692 if (!(V & 0x00FFFFFF)) {
8693 RequiredImm = (0b10011 << 8) | (V >> 24);
8694 return {true, RequiredImm};
8695 }
8696 // 4'b0110
8697 if ((V & 0xFFFF00FF) == 0xFF) {
8698 RequiredImm = (0b10110 << 8) | (V >> 8);
8699 return {true, RequiredImm};
8700 }
8701 // 4'b0111
8702 if ((V & 0xFF00FFFF) == 0xFFFF) {
8703 RequiredImm = (0b10111 << 8) | (V >> 16);
8704 return {true, RequiredImm};
8705 }
8706 // 4'b1010
8707 if ((V & 0x7E07FFFF) == 0x3E000000 || (V & 0x7E07FFFF) == 0x40000000) {
8708 RequiredImm =
8709 (0b11010 << 8) | (((V >> 24) & 0xC0) ^ 0x40) | ((V >> 19) & 0x3F);
8710 return {true, RequiredImm};
8711 }
8712 } else if (SplatBitSize == 64) {
8713 // 4'b1011
8714 if ((V & 0xFFFFFFFF7E07FFFFULL) == 0x3E000000ULL ||
8715 (V & 0xFFFFFFFF7E07FFFFULL) == 0x40000000ULL) {
8716 RequiredImm =
8717 (0b11011 << 8) | (((V >> 24) & 0xC0) ^ 0x40) | ((V >> 19) & 0x3F);
8718 return {true, RequiredImm};
8719 }
8720 // 4'b1100
8721 if ((V & 0x7FC0FFFFFFFFFFFFULL) == 0x4000000000000000ULL ||
8722 (V & 0x7FC0FFFFFFFFFFFFULL) == 0x3FC0000000000000ULL) {
8723 RequiredImm =
8724 (0b11100 << 8) | (((V >> 56) & 0xC0) ^ 0x40) | ((V >> 48) & 0x3F);
8725 return {true, RequiredImm};
8726 }
8727 // 4'b1001
8728 auto sameBitsPreByte = [](uint64_t x) -> std::pair<bool, uint8_t> {
8729 uint8_t res = 0;
8730 for (int i = 0; i < 8; ++i) {
8731 uint8_t byte = x & 0xFF;
8732 if (byte == 0 || byte == 0xFF)
8733 res |= ((byte & 1) << i);
8734 else
8735 return {false, 0};
8736 x >>= 8;
8737 }
8738 return {true, res};
8739 };
8740 auto [IsSame, Suffix] = sameBitsPreByte(V);
8741 if (IsSame) {
8742 RequiredImm = (0b11001 << 8) | Suffix;
8743 return {true, RequiredImm};
8744 }
8745 }
8746 return {false, RequiredImm};
8747}
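As a worked example of the encoding above (an illustrative sketch; the helper below is hypothetical and not part of this file): a 32-bit splat value whose only non-zero byte is byte 1 matches the 4'b0001 case, so a splat of 0x00003400 would yield the immediate (0b10001 << 8) | 0x34 = 0x1134, which has imm[12] set as required.

// Illustrative sketch only: the 4'b0001 case above for a 32-bit splat value V
// with (V & 0xFFFF00FF) == 0, e.g. V = 0x00003400.
static uint64_t exampleEncodeVldi32Byte1(uint64_t V) {
  return (0b10001 << 8) | (V >> 8); // 0x00003400 -> 0x1134
}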
8748
8750 EVT VT) const {
8751 if (!Subtarget.hasExtLSX())
8752 return false;
8753
8754 if (VT == MVT::f32) {
8755 uint64_t masked = Imm.bitcastToAPInt().getZExtValue() & 0x7e07ffff;
8756 return (masked == 0x3e000000 || masked == 0x40000000);
8757 }
8758
8759 if (VT == MVT::f64) {
8760 uint64_t masked = Imm.bitcastToAPInt().getZExtValue() & 0x7fc0ffffffffffff;
8761 return (masked == 0x3fc0000000000000 || masked == 0x4000000000000000);
8762 }
8763
8764 return false;
8765}
8766
8767bool LoongArchTargetLowering::isFPImmLegal(const APFloat &Imm, EVT VT,
8768 bool ForCodeSize) const {
8769 // TODO: Maybe need more checks here after vector extension is supported.
8770 if (VT == MVT::f32 && !Subtarget.hasBasicF())
8771 return false;
8772 if (VT == MVT::f64 && !Subtarget.hasBasicD())
8773 return false;
8774 return (Imm.isZero() || Imm.isExactlyValue(1.0) || isFPImmVLDILegal(Imm, VT));
8775}
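For instance (an illustrative sketch; the helper is hypothetical), the f32 branch of isFPImmVLDILegal accepts exactly those bit patterns whose masked form is one of the two values above: 1.0f (0x3f800000) masks to 0x3e000000 and is accepted, while 0.1f (0x3dcccccd) masks to 0x3c04cccd and falls back to a constant pool.

// Illustrative sketch only: the same f32 mask test as isFPImmVLDILegal, applied
// to a raw IEEE single-precision bit pattern.
static bool exampleIsF32VldiEncodable(uint32_t Bits) {
  uint32_t Masked = Bits & 0x7e07ffff;
  return Masked == 0x3e000000 || Masked == 0x40000000;
}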
8776
8778 return true;
8779}
8780
8782 return true;
8783}
8784
8785bool LoongArchTargetLowering::shouldInsertFencesForAtomic(
8786 const Instruction *I) const {
8787 if (!Subtarget.is64Bit())
8788 return isa<LoadInst>(I) || isa<StoreInst>(I);
8789
8790 if (isa<LoadInst>(I))
8791 return true;
8792
8793 // On LA64, atomic store operations with IntegerBitWidth of 32 and 64 do not
8794 // require fences because we can use amswap_db.[w/d].
8795 Type *Ty = I->getOperand(0)->getType();
8796 if (isa<StoreInst>(I) && Ty->isIntegerTy()) {
8797 unsigned Size = Ty->getIntegerBitWidth();
8798 return (Size == 8 || Size == 16);
8799 }
8800
8801 return false;
8802}
8803
8805 LLVMContext &Context,
8806 EVT VT) const {
8807 if (!VT.isVector())
8808 return getPointerTy(DL);
8810}
8811
8813 EVT VT = Y.getValueType();
8814
8815 if (VT.isVector())
8816 return Subtarget.hasExtLSX() && VT.isInteger();
8817
8818 return VT.isScalarInteger() && !isa<ConstantSDNode>(Y);
8819}
8820
8822 const CallInst &I,
8823 MachineFunction &MF,
8824 unsigned Intrinsic) const {
8825 switch (Intrinsic) {
8826 default:
8827 return false;
8828 case Intrinsic::loongarch_masked_atomicrmw_xchg_i32:
8829 case Intrinsic::loongarch_masked_atomicrmw_add_i32:
8830 case Intrinsic::loongarch_masked_atomicrmw_sub_i32:
8831 case Intrinsic::loongarch_masked_atomicrmw_nand_i32:
8832 Info.opc = ISD::INTRINSIC_W_CHAIN;
8833 Info.memVT = MVT::i32;
8834 Info.ptrVal = I.getArgOperand(0);
8835 Info.offset = 0;
8836 Info.align = Align(4);
8839 return true;
8840 // TODO: Add more Intrinsics later.
8841 }
8842}
8843
8844// When -mlamcas is enabled, MinCmpXchgSizeInBits is set to 8, so atomicrmw
8845// and/or/xor operations with operands narrower than 32 bits cannot be
8846// expanded to am{and/or/xor}[_db].w through AtomicExpandPass. To prevent a
8847// regression, we expand them manually here.
8850
8852 Op == AtomicRMWInst::And) &&
8853 "Unable to expand");
8854 unsigned MinWordSize = 4;
8855
8856 IRBuilder<> Builder(AI);
8857 LLVMContext &Ctx = Builder.getContext();
8858 const DataLayout &DL = AI->getDataLayout();
8859 Type *ValueType = AI->getType();
8860 Type *WordType = Type::getIntNTy(Ctx, MinWordSize * 8);
8861
8862 Value *Addr = AI->getPointerOperand();
8863 PointerType *PtrTy = cast<PointerType>(Addr->getType());
8864 IntegerType *IntTy = DL.getIndexType(Ctx, PtrTy->getAddressSpace());
8865
8866 Value *AlignedAddr = Builder.CreateIntrinsic(
8867 Intrinsic::ptrmask, {PtrTy, IntTy},
8868 {Addr, ConstantInt::get(IntTy, ~(uint64_t)(MinWordSize - 1))}, nullptr,
8869 "AlignedAddr");
8870
8871 Value *AddrInt = Builder.CreatePtrToInt(Addr, IntTy);
8872 Value *PtrLSB = Builder.CreateAnd(AddrInt, MinWordSize - 1, "PtrLSB");
8873 Value *ShiftAmt = Builder.CreateShl(PtrLSB, 3);
8874 ShiftAmt = Builder.CreateTrunc(ShiftAmt, WordType, "ShiftAmt");
8875 Value *Mask = Builder.CreateShl(
8876 ConstantInt::get(WordType,
8877 (1 << (DL.getTypeStoreSize(ValueType) * 8)) - 1),
8878 ShiftAmt, "Mask");
8879 Value *Inv_Mask = Builder.CreateNot(Mask, "Inv_Mask");
8880 Value *ValOperand_Shifted =
8881 Builder.CreateShl(Builder.CreateZExt(AI->getValOperand(), WordType),
8882 ShiftAmt, "ValOperand_Shifted");
8883 Value *NewOperand;
8884 if (Op == AtomicRMWInst::And)
8885 NewOperand = Builder.CreateOr(ValOperand_Shifted, Inv_Mask, "AndOperand");
8886 else
8887 NewOperand = ValOperand_Shifted;
8888
8889 AtomicRMWInst *NewAI =
8890 Builder.CreateAtomicRMW(Op, AlignedAddr, NewOperand, Align(MinWordSize),
8891 AI->getOrdering(), AI->getSyncScopeID());
8892
8893 Value *Shift = Builder.CreateLShr(NewAI, ShiftAmt, "shifted");
8894 Value *Trunc = Builder.CreateTrunc(Shift, ValueType, "extracted");
8895 Value *FinalOldResult = Builder.CreateBitCast(Trunc, ValueType);
8896 AI->replaceAllUsesWith(FinalOldResult);
8897 AI->eraseFromParent();
8898}
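To ground the mask/shift arithmetic above (a standalone sketch assuming the little-endian layout LoongArch uses; the helper is hypothetical): an i8 operand two bytes into its naturally aligned i32 word gets ShiftAmt = 16 and Mask = 0x00FF0000, so the byte is rotated into bits [23:16] of the widened access.

// Illustrative sketch only: the word-offset arithmetic performed above for an
// i8 atomicrmw at address Addr (MinWordSize == 4).
static void exampleSubwordMask(uint64_t Addr, uint64_t &ShiftAmt, uint64_t &Mask) {
  uint64_t PtrLSB = Addr & 3; // byte offset within the aligned i32 word
  ShiftAmt = PtrLSB * 8;      // Addr % 4 == 2  ->  ShiftAmt == 16
  Mask = 0xFFull << ShiftAmt; // -> 0x00FF0000 selects that byte
}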
8899
8902 // TODO: Add more AtomicRMWInsts that need to be extended.
8903
8904 // Since floating-point operations require a non-trivial set of data
8905 // operations, use CmpXChg to expand.
8906 if (AI->isFloatingPointOperation() ||
8912
8913 if (Subtarget.hasLAM_BH() && Subtarget.is64Bit() &&
8916 AI->getOperation() == AtomicRMWInst::Sub)) {
8918 }
8919
8920 unsigned Size = AI->getType()->getPrimitiveSizeInBits();
8921 if (Subtarget.hasLAMCAS()) {
8922 if (Size < 32 && (AI->getOperation() == AtomicRMWInst::And ||
8926 if (AI->getOperation() == AtomicRMWInst::Nand || Size < 32)
8928 }
8929
8930 if (Size == 8 || Size == 16)
8933}
8934
8935static Intrinsic::ID
8937 AtomicRMWInst::BinOp BinOp) {
8938 if (GRLen == 64) {
8939 switch (BinOp) {
8940 default:
8941 llvm_unreachable("Unexpected AtomicRMW BinOp");
8943 return Intrinsic::loongarch_masked_atomicrmw_xchg_i64;
8944 case AtomicRMWInst::Add:
8945 return Intrinsic::loongarch_masked_atomicrmw_add_i64;
8946 case AtomicRMWInst::Sub:
8947 return Intrinsic::loongarch_masked_atomicrmw_sub_i64;
8949 return Intrinsic::loongarch_masked_atomicrmw_nand_i64;
8951 return Intrinsic::loongarch_masked_atomicrmw_umax_i64;
8953 return Intrinsic::loongarch_masked_atomicrmw_umin_i64;
8954 case AtomicRMWInst::Max:
8955 return Intrinsic::loongarch_masked_atomicrmw_max_i64;
8956 case AtomicRMWInst::Min:
8957 return Intrinsic::loongarch_masked_atomicrmw_min_i64;
8958 // TODO: support other AtomicRMWInst.
8959 }
8960 }
8961
8962 if (GRLen == 32) {
8963 switch (BinOp) {
8964 default:
8965 llvm_unreachable("Unexpected AtomicRMW BinOp");
8967 return Intrinsic::loongarch_masked_atomicrmw_xchg_i32;
8968 case AtomicRMWInst::Add:
8969 return Intrinsic::loongarch_masked_atomicrmw_add_i32;
8970 case AtomicRMWInst::Sub:
8971 return Intrinsic::loongarch_masked_atomicrmw_sub_i32;
8973 return Intrinsic::loongarch_masked_atomicrmw_nand_i32;
8975 return Intrinsic::loongarch_masked_atomicrmw_umax_i32;
8977 return Intrinsic::loongarch_masked_atomicrmw_umin_i32;
8978 case AtomicRMWInst::Max:
8979 return Intrinsic::loongarch_masked_atomicrmw_max_i32;
8980 case AtomicRMWInst::Min:
8981 return Intrinsic::loongarch_masked_atomicrmw_min_i32;
8982 // TODO: support other AtomicRMWInst.
8983 }
8984 }
8985
8986 llvm_unreachable("Unexpected GRLen\n");
8987}
8988
8991 AtomicCmpXchgInst *CI) const {
8992
8993 if (Subtarget.hasLAMCAS())
8995
8997 if (Size == 8 || Size == 16)
9000}
9001
9003 IRBuilderBase &Builder, AtomicCmpXchgInst *CI, Value *AlignedAddr,
9004 Value *CmpVal, Value *NewVal, Value *Mask, AtomicOrdering Ord) const {
9005 unsigned GRLen = Subtarget.getGRLen();
9006 AtomicOrdering FailOrd = CI->getFailureOrdering();
9007 Value *FailureOrdering =
9008 Builder.getIntN(Subtarget.getGRLen(), static_cast<uint64_t>(FailOrd));
9009 Intrinsic::ID CmpXchgIntrID = Intrinsic::loongarch_masked_cmpxchg_i32;
9010 if (GRLen == 64) {
9011 CmpXchgIntrID = Intrinsic::loongarch_masked_cmpxchg_i64;
9012 CmpVal = Builder.CreateSExt(CmpVal, Builder.getInt64Ty());
9013 NewVal = Builder.CreateSExt(NewVal, Builder.getInt64Ty());
9014 Mask = Builder.CreateSExt(Mask, Builder.getInt64Ty());
9015 }
9016 Type *Tys[] = {AlignedAddr->getType()};
9017 Value *Result = Builder.CreateIntrinsic(
9018 CmpXchgIntrID, Tys, {AlignedAddr, CmpVal, NewVal, Mask, FailureOrdering});
9019 if (GRLen == 64)
9020 Result = Builder.CreateTrunc(Result, Builder.getInt32Ty());
9021 return Result;
9022}
9023
9025 IRBuilderBase &Builder, AtomicRMWInst *AI, Value *AlignedAddr, Value *Incr,
9026 Value *Mask, Value *ShiftAmt, AtomicOrdering Ord) const {
9027 // In the case of an atomicrmw xchg with a constant 0/-1 operand, replace
9028 // the atomic instruction with an AtomicRMWInst::And/Or with appropriate
9029 // mask, as this produces better code than the LL/SC loop emitted by
9030 // int_loongarch_masked_atomicrmw_xchg.
9031 if (AI->getOperation() == AtomicRMWInst::Xchg &&
9034 if (CVal->isZero())
9035 return Builder.CreateAtomicRMW(AtomicRMWInst::And, AlignedAddr,
9036 Builder.CreateNot(Mask, "Inv_Mask"),
9037 AI->getAlign(), Ord);
9038 if (CVal->isMinusOne())
9039 return Builder.CreateAtomicRMW(AtomicRMWInst::Or, AlignedAddr, Mask,
9040 AI->getAlign(), Ord);
9041 }
9042
9043 unsigned GRLen = Subtarget.getGRLen();
9044 Value *Ordering =
9045 Builder.getIntN(GRLen, static_cast<uint64_t>(AI->getOrdering()));
9046 Type *Tys[] = {AlignedAddr->getType()};
9048 AI->getModule(),
9050
9051 if (GRLen == 64) {
9052 Incr = Builder.CreateSExt(Incr, Builder.getInt64Ty());
9053 Mask = Builder.CreateSExt(Mask, Builder.getInt64Ty());
9054 ShiftAmt = Builder.CreateSExt(ShiftAmt, Builder.getInt64Ty());
9055 }
9056
9057 Value *Result;
9058
9059 // Must pass the shift amount needed to sign extend the loaded value prior
9060 // to performing a signed comparison for min/max. ShiftAmt is the number of
9061 // bits to shift the value into position. Pass GRLen-ShiftAmt-ValWidth, which
9062 // is the number of bits to left+right shift the value in order to
9063 // sign-extend.
9064 if (AI->getOperation() == AtomicRMWInst::Min ||
9066 const DataLayout &DL = AI->getDataLayout();
9067 unsigned ValWidth =
9068 DL.getTypeStoreSizeInBits(AI->getValOperand()->getType());
9069 Value *SextShamt =
9070 Builder.CreateSub(Builder.getIntN(GRLen, GRLen - ValWidth), ShiftAmt);
9071 Result = Builder.CreateCall(LlwOpScwLoop,
9072 {AlignedAddr, Incr, Mask, SextShamt, Ordering});
9073 } else {
9074 Result =
9075 Builder.CreateCall(LlwOpScwLoop, {AlignedAddr, Incr, Mask, Ordering});
9076 }
9077
9078 if (GRLen == 64)
9079 Result = Builder.CreateTrunc(Result, Builder.getInt32Ty());
9080 return Result;
9081}
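As a quick numeric check of the comment above (illustrative only; the helper is made up): for a min/max on an i16 held at byte offset 2 of its word on LA64, GRLen = 64, ValWidth = 16 and ShiftAmt = 16, so the intrinsic is passed a sign-extension shift of 32.

// Illustrative sketch only: the GRLen - ValWidth - ShiftAmt value passed to the
// masked min/max intrinsic above.
static uint64_t exampleSextShamt(uint64_t GRLen, uint64_t ValWidth, uint64_t ShiftAmt) {
  return (GRLen - ValWidth) - ShiftAmt; // 64 - 16 - 16 == 32
}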
9082
9084 const MachineFunction &MF, EVT VT) const {
9085 VT = VT.getScalarType();
9086
9087 if (!VT.isSimple())
9088 return false;
9089
9090 switch (VT.getSimpleVT().SimpleTy) {
9091 case MVT::f32:
9092 case MVT::f64:
9093 return true;
9094 default:
9095 break;
9096 }
9097
9098 return false;
9099}
9100
9102 const Constant *PersonalityFn) const {
9103 return LoongArch::R4;
9104}
9105
9107 const Constant *PersonalityFn) const {
9108 return LoongArch::R5;
9109}
9110
9111//===----------------------------------------------------------------------===//
9112// Target Optimization Hooks
9113//===----------------------------------------------------------------------===//
9114
9116 const LoongArchSubtarget &Subtarget) {
9117 // The FRECIPE instructions have a relative accuracy of 2^-14.
9118 // IEEE single precision has 23 significand bits and double precision has 52.
9119 int RefinementSteps = VT.getScalarType() == MVT::f64 ? 2 : 1;
9120 return RefinementSteps;
9121}
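The step counts follow from the usual Newton-Raphson error analysis (a back-of-the-envelope sketch, not code from this file): each iteration roughly squares the relative error of the 2^-14 estimate, so one step reaches about 2^-28, enough for f32's 24-bit significand, and two steps reach about 2^-56, enough for f64's 53 bits.

// Illustrative sketch only: approximate accuracy (in bits) after N refinement
// steps, starting from the 14-bit frecipe/frsqrte estimate.
static unsigned exampleAccuracyBits(unsigned Steps) {
  unsigned Bits = 14;
  for (unsigned I = 0; I < Steps; ++I)
    Bits *= 2; // error roughly squares per Newton-Raphson step
  return Bits; // 1 step -> 28 bits (f32), 2 steps -> 56 bits (f64)
}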
9122
9124 SelectionDAG &DAG, int Enabled,
9125 int &RefinementSteps,
9126 bool &UseOneConstNR,
9127 bool Reciprocal) const {
9128 if (Subtarget.hasFrecipe()) {
9129 SDLoc DL(Operand);
9130 EVT VT = Operand.getValueType();
9131
9132 if (VT == MVT::f32 || (VT == MVT::f64 && Subtarget.hasBasicD()) ||
9133 (VT == MVT::v4f32 && Subtarget.hasExtLSX()) ||
9134 (VT == MVT::v2f64 && Subtarget.hasExtLSX()) ||
9135 (VT == MVT::v8f32 && Subtarget.hasExtLASX()) ||
9136 (VT == MVT::v4f64 && Subtarget.hasExtLASX())) {
9137
9138 if (RefinementSteps == ReciprocalEstimate::Unspecified)
9139 RefinementSteps = getEstimateRefinementSteps(VT, Subtarget);
9140
9141 SDValue Estimate = DAG.getNode(LoongArchISD::FRSQRTE, DL, VT, Operand);
9142 if (Reciprocal)
9143 Estimate = DAG.getNode(ISD::FMUL, DL, VT, Operand, Estimate);
9144
9145 return Estimate;
9146 }
9147 }
9148
9149 return SDValue();
9150}
9151
9153 SelectionDAG &DAG,
9154 int Enabled,
9155 int &RefinementSteps) const {
9156 if (Subtarget.hasFrecipe()) {
9157 SDLoc DL(Operand);
9158 EVT VT = Operand.getValueType();
9159
9160 if (VT == MVT::f32 || (VT == MVT::f64 && Subtarget.hasBasicD()) ||
9161 (VT == MVT::v4f32 && Subtarget.hasExtLSX()) ||
9162 (VT == MVT::v2f64 && Subtarget.hasExtLSX()) ||
9163 (VT == MVT::v8f32 && Subtarget.hasExtLASX()) ||
9164 (VT == MVT::v4f64 && Subtarget.hasExtLASX())) {
9165
9166 if (RefinementSteps == ReciprocalEstimate::Unspecified)
9167 RefinementSteps = getEstimateRefinementSteps(VT, Subtarget);
9168
9169 return DAG.getNode(LoongArchISD::FRECIPE, DL, VT, Operand);
9170 }
9171 }
9172
9173 return SDValue();
9174}
9175
9176//===----------------------------------------------------------------------===//
9177// LoongArch Inline Assembly Support
9178//===----------------------------------------------------------------------===//
9179
9181LoongArchTargetLowering::getConstraintType(StringRef Constraint) const {
9182 // LoongArch specific constraints in GCC: config/loongarch/constraints.md
9183 //
9184 // 'f': A floating-point register (if available).
9185 // 'k': A memory operand whose address is formed by a base register and
9186 // (optionally scaled) index register.
9187 // 'l': A signed 16-bit constant.
9188 // 'm': A memory operand whose address is formed by a base register and
9189 // offset that is suitable for use in instructions with the same
9190 // addressing mode as st.w and ld.w.
9191 // 'q': A general-purpose register except for $r0 and $r1 (for the csrxchg
9192 // instruction)
9193 // 'I': A signed 12-bit constant (for arithmetic instructions).
9194 // 'J': Integer zero.
9195 // 'K': An unsigned 12-bit constant (for logic instructions).
9196 // "ZB": An address that is held in a general-purpose register. The offset is
9197 // zero.
9198 // "ZC": A memory operand whose address is formed by a base register and
9199 // offset that is suitable for use in instructions with the same
9200 // addressing mode as ll.w and sc.w.
9201 if (Constraint.size() == 1) {
9202 switch (Constraint[0]) {
9203 default:
9204 break;
9205 case 'f':
9206 case 'q':
9207 return C_RegisterClass;
9208 case 'l':
9209 case 'I':
9210 case 'J':
9211 case 'K':
9212 return C_Immediate;
9213 case 'k':
9214 return C_Memory;
9215 }
9216 }
9217
9218 if (Constraint == "ZC" || Constraint == "ZB")
9219 return C_Memory;
9220
9221 // 'm' is handled here.
9222 return TargetLowering::getConstraintType(Constraint);
9223}
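As a user-side illustration of these constraint letters (a sketch assuming a LoongArch64 target and GNU extended asm; it is not part of the lowering): 'r' and '=r' select GPRs, and 'I' requires a signed 12-bit immediate, which LowerAsmOperandForConstraint below validates.

// Illustrative sketch only: typical use of the 'r' and 'I' constraints documented
// above, assuming a LoongArch64 target.
static long exampleAddImmediate(long X) {
  long Res;
  asm("addi.d %0, %1, %2" : "=r"(Res) : "r"(X), "I"(100));
  return Res;
}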
9224
9225InlineAsm::ConstraintCode LoongArchTargetLowering::getInlineAsmMemConstraint(
9226 StringRef ConstraintCode) const {
9227 return StringSwitch<InlineAsm::ConstraintCode>(ConstraintCode)
9231 .Default(TargetLowering::getInlineAsmMemConstraint(ConstraintCode));
9232}
9233
9234std::pair<unsigned, const TargetRegisterClass *>
9235LoongArchTargetLowering::getRegForInlineAsmConstraint(
9236 const TargetRegisterInfo *TRI, StringRef Constraint, MVT VT) const {
9237 // First, see if this is a constraint that directly corresponds to a LoongArch
9238 // register class.
9239 if (Constraint.size() == 1) {
9240 switch (Constraint[0]) {
9241 case 'r':
9242 // TODO: Support fixed vectors up to GRLen?
9243 if (VT.isVector())
9244 break;
9245 return std::make_pair(0U, &LoongArch::GPRRegClass);
9246 case 'q':
9247 return std::make_pair(0U, &LoongArch::GPRNoR0R1RegClass);
9248 case 'f':
9249 if (Subtarget.hasBasicF() && VT == MVT::f32)
9250 return std::make_pair(0U, &LoongArch::FPR32RegClass);
9251 if (Subtarget.hasBasicD() && VT == MVT::f64)
9252 return std::make_pair(0U, &LoongArch::FPR64RegClass);
9253 if (Subtarget.hasExtLSX() &&
9254 TRI->isTypeLegalForClass(LoongArch::LSX128RegClass, VT))
9255 return std::make_pair(0U, &LoongArch::LSX128RegClass);
9256 if (Subtarget.hasExtLASX() &&
9257 TRI->isTypeLegalForClass(LoongArch::LASX256RegClass, VT))
9258 return std::make_pair(0U, &LoongArch::LASX256RegClass);
9259 break;
9260 default:
9261 break;
9262 }
9263 }
9264
9265 // TargetLowering::getRegForInlineAsmConstraint uses the name of the TableGen
9266 // record (e.g. the "R0" in `def R0`) to choose registers for InlineAsm
9267 // constraints while the official register name is prefixed with a '$'. So we
9268 // clip the '$' from the original constraint string (e.g. {$r0} to {r0}.)
9269 // before it is parsed. And TargetLowering::getRegForInlineAsmConstraint is
9270 // case insensitive, so no need to convert the constraint to upper case here.
9271 //
9272 // For now, no need to support ABI names (e.g. `$a0`) as clang will correctly
9273 // decode the usage of register name aliases into their official names. And
9274 // AFAIK, the not yet upstreamed `rustc` for LoongArch will always use
9275 // official register names.
9276 if (Constraint.starts_with("{$r") || Constraint.starts_with("{$f") ||
9277 Constraint.starts_with("{$vr") || Constraint.starts_with("{$xr")) {
9278 bool IsFP = Constraint[2] == 'f';
9279 std::pair<StringRef, StringRef> Temp = Constraint.split('$');
9280 std::pair<unsigned, const TargetRegisterClass *> R;
9282 TRI, join_items("", Temp.first, Temp.second), VT);
9283 // Match those names to the widest floating point register type available.
9284 if (IsFP) {
9285 unsigned RegNo = R.first;
9286 if (LoongArch::F0 <= RegNo && RegNo <= LoongArch::F31) {
9287 if (Subtarget.hasBasicD() && (VT == MVT::f64 || VT == MVT::Other)) {
9288 unsigned DReg = RegNo - LoongArch::F0 + LoongArch::F0_64;
9289 return std::make_pair(DReg, &LoongArch::FPR64RegClass);
9290 }
9291 }
9292 }
9293 return R;
9294 }
9295
9296 return TargetLowering::getRegForInlineAsmConstraint(TRI, Constraint, VT);
9297}
9298
9299void LoongArchTargetLowering::LowerAsmOperandForConstraint(
9300 SDValue Op, StringRef Constraint, std::vector<SDValue> &Ops,
9301 SelectionDAG &DAG) const {
9302 // Currently only support length 1 constraints.
9303 if (Constraint.size() == 1) {
9304 switch (Constraint[0]) {
9305 case 'l':
9306 // Validate & create a 16-bit signed immediate operand.
9307 if (auto *C = dyn_cast<ConstantSDNode>(Op)) {
9308 uint64_t CVal = C->getSExtValue();
9309 if (isInt<16>(CVal))
9310 Ops.push_back(DAG.getSignedTargetConstant(CVal, SDLoc(Op),
9311 Subtarget.getGRLenVT()));
9312 }
9313 return;
9314 case 'I':
9315 // Validate & create a 12-bit signed immediate operand.
9316 if (auto *C = dyn_cast<ConstantSDNode>(Op)) {
9317 uint64_t CVal = C->getSExtValue();
9318 if (isInt<12>(CVal))
9319 Ops.push_back(DAG.getSignedTargetConstant(CVal, SDLoc(Op),
9320 Subtarget.getGRLenVT()));
9321 }
9322 return;
9323 case 'J':
9324 // Validate & create an integer zero operand.
9325 if (auto *C = dyn_cast<ConstantSDNode>(Op))
9326 if (C->getZExtValue() == 0)
9327 Ops.push_back(
9328 DAG.getTargetConstant(0, SDLoc(Op), Subtarget.getGRLenVT()));
9329 return;
9330 case 'K':
9331 // Validate & create a 12-bit unsigned immediate operand.
9332 if (auto *C = dyn_cast<ConstantSDNode>(Op)) {
9333 uint64_t CVal = C->getZExtValue();
9334 if (isUInt<12>(CVal))
9335 Ops.push_back(
9336 DAG.getTargetConstant(CVal, SDLoc(Op), Subtarget.getGRLenVT()));
9337 }
9338 return;
9339 default:
9340 break;
9341 }
9342 }
9344}
9345
9346#define GET_REGISTER_MATCHER
9347#include "LoongArchGenAsmMatcher.inc"
9348
9351 const MachineFunction &MF) const {
9352 std::pair<StringRef, StringRef> Name = StringRef(RegName).split('$');
9353 std::string NewRegName = Name.second.str();
9354 Register Reg = MatchRegisterAltName(NewRegName);
9355 if (!Reg)
9356 Reg = MatchRegisterName(NewRegName);
9357 if (!Reg)
9358 return Reg;
9359 BitVector ReservedRegs = Subtarget.getRegisterInfo()->getReservedRegs(MF);
9360 if (!ReservedRegs.test(Reg))
9361 report_fatal_error(Twine("Trying to obtain non-reserved register \"" +
9362 StringRef(RegName) + "\"."));
9363 return Reg;
9364}
9365
9367 EVT VT, SDValue C) const {
9368 // TODO: Support vectors.
9369 if (!VT.isScalarInteger())
9370 return false;
9371
9372 // Omit the optimization if the data size exceeds GRLen.
9373 if (VT.getSizeInBits() > Subtarget.getGRLen())
9374 return false;
9375
9376 if (auto *ConstNode = dyn_cast<ConstantSDNode>(C.getNode())) {
9377 const APInt &Imm = ConstNode->getAPIntValue();
9378 // Break MUL into (SLLI + ADD/SUB) or ALSL.
9379 if ((Imm + 1).isPowerOf2() || (Imm - 1).isPowerOf2() ||
9380 (1 - Imm).isPowerOf2() || (-1 - Imm).isPowerOf2())
9381 return true;
9382 // Break MUL into (ALSL x, (SLLI x, imm0), imm1).
9383 if (ConstNode->hasOneUse() &&
9384 ((Imm - 2).isPowerOf2() || (Imm - 4).isPowerOf2() ||
9385 (Imm - 8).isPowerOf2() || (Imm - 16).isPowerOf2()))
9386 return true;
9387 // Break (MUL x, imm) into (ADD (SLLI x, s0), (SLLI x, s1)),
9388 // in which the immediate has two set bits. Or break (MUL x, imm)
9389 // into (SUB (SLLI x, s0), (SLLI x, s1)), in which the immediate
9390 // equals (1 << s0) - (1 << s1).
9391 if (ConstNode->hasOneUse() && !(Imm.sge(-2048) && Imm.sle(4095))) {
9392 unsigned Shifts = Imm.countr_zero();
9393 // Reject immediates which can be composed via a single LUI.
9394 if (Shifts >= 12)
9395 return false;
9396 // Reject multiplications that can be optimized to
9397 // (SLLI (ALSL x, x, 1/2/3/4), s).
9398 APInt ImmPop = Imm.ashr(Shifts);
9399 if (ImmPop == 3 || ImmPop == 5 || ImmPop == 9 || ImmPop == 17)
9400 return false;
9401 // We do not consider the case `(-Imm - ImmSmall).isPowerOf2()`,
9402 // since it needs one more instruction than the other 3 cases.
9403 APInt ImmSmall = APInt(Imm.getBitWidth(), 1ULL << Shifts, true);
9404 if ((Imm - ImmSmall).isPowerOf2() || (Imm + ImmSmall).isPowerOf2() ||
9405 (ImmSmall - Imm).isPowerOf2())
9406 return true;
9407 }
9408 }
9409
9410 return false;
9411}
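A few concrete cases the hook above accepts (illustrative only; the helper below is hypothetical and only covers the simplest positive patterns): x*3 becomes (x<<1)+x since 3-1 is a power of two, x*7 becomes (x<<3)-x since 7+1 is a power of two, and x*6 becomes (x<<2)+(x<<1) since 6-2 is a power of two.

// Illustrative sketch only: a subset of the shift/add-friendly immediates accepted
// above (positive values, ignoring the one-use and LUI-range checks).
static bool exampleIsSimpleShiftAddImm(long long Imm) {
  auto IsPow2 = [](long long V) { return V > 0 && (V & (V - 1)) == 0; };
  return IsPow2(Imm - 1) || IsPow2(Imm + 1) || // x*3, x*7
         IsPow2(Imm - 2) || IsPow2(Imm - 4) || // x*6, x*68
         IsPow2(Imm - 8) || IsPow2(Imm - 16);
}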
9412
9414 const AddrMode &AM,
9415 Type *Ty, unsigned AS,
9416 Instruction *I) const {
9417 // LoongArch has four basic addressing modes:
9418 // 1. reg
9419 // 2. reg + 12-bit signed offset
9420 // 3. reg + 14-bit signed offset left-shifted by 2
9421 // 4. reg1 + reg2
9422 // TODO: Add more checks after supporting the vector extension.
9423
9424 // No global is ever allowed as a base.
9425 if (AM.BaseGV)
9426 return false;
9427
9428 // Require a 12-bit signed offset or 14-bit signed offset left-shifted by 2
9429 // with `UAL` feature.
9430 if (!isInt<12>(AM.BaseOffs) &&
9431 !(isShiftedInt<14, 2>(AM.BaseOffs) && Subtarget.hasUAL()))
9432 return false;
9433
9434 switch (AM.Scale) {
9435 case 0:
9436 // "r+i" or just "i", depending on HasBaseReg.
9437 break;
9438 case 1:
9439 // "r+r+i" is not allowed.
9440 if (AM.HasBaseReg && AM.BaseOffs)
9441 return false;
9442 // Otherwise we have "r+r" or "r+i".
9443 break;
9444 case 2:
9445 // "2*r+r" or "2*r+i" is not allowed.
9446 if (AM.HasBaseReg || AM.BaseOffs)
9447 return false;
9448 // Allow "2*r" as "r+r".
9449 break;
9450 default:
9451 return false;
9452 }
9453
9454 return true;
9455}
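For the immediate-offset part of the check above, a standalone sketch (hypothetical helper, assuming the UAL feature so the shifted 14-bit form is usable): an offset of 2047 fits the plain 12-bit form, 2048 only fits the 14-bit form shifted left by 2, and 2050 fits neither.

// Illustrative sketch only: the base-offset legality test above, assuming UAL.
static bool exampleIsLegalBaseOffset(long long Offs) {
  auto FitsSigned = [](long long V, unsigned N) {
    return V >= -(1LL << (N - 1)) && V < (1LL << (N - 1));
  };
  if (FitsSigned(Offs, 12))
    return true;                                       // e.g. 2047
  return (Offs & 3) == 0 && FitsSigned(Offs >> 2, 14); // e.g. 2048, 32764
}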
9456
9458 return isInt<12>(Imm);
9459}
9460
9462 return isInt<12>(Imm);
9463}
9464
9466 // Zexts are free if they can be combined with a load.
9467 // Don't advertise i32->i64 zextload as being free for LA64. It interacts
9468 // poorly with type legalization of compares preferring sext.
9469 if (auto *LD = dyn_cast<LoadSDNode>(Val)) {
9470 EVT MemVT = LD->getMemoryVT();
9471 if ((MemVT == MVT::i8 || MemVT == MVT::i16) &&
9472 (LD->getExtensionType() == ISD::NON_EXTLOAD ||
9473 LD->getExtensionType() == ISD::ZEXTLOAD))
9474 return true;
9475 }
9476
9477 return TargetLowering::isZExtFree(Val, VT2);
9478}
9479
9481 EVT DstVT) const {
9482 return Subtarget.is64Bit() && SrcVT == MVT::i32 && DstVT == MVT::i64;
9483}
9484
9486 return Subtarget.is64Bit() && CI->getType()->isIntegerTy(32);
9487}
9488
9490 // TODO: Support vectors.
9491 if (Y.getValueType().isVector())
9492 return false;
9493
9494 return !isa<ConstantSDNode>(Y);
9495}
9496
9498 // LAMCAS will use amcas[_DB].{b/h/w/d} which does not require extension.
9499 return Subtarget.hasLAMCAS() ? ISD::ANY_EXTEND : ISD::SIGN_EXTEND;
9500}
9501
9503 Type *Ty, bool IsSigned) const {
9504 if (Subtarget.is64Bit() && Ty->isIntegerTy(32))
9505 return true;
9506
9507 return IsSigned;
9508}
9509
9511 // Return false to suppress the unnecessary extensions if the LibCall
9512 // arguments or return value is a float narrower than GRLEN on a soft FP ABI.
9513 if (Subtarget.isSoftFPABI() && (Type.isFloatingPoint() && !Type.isVector() &&
9514 Type.getSizeInBits() < Subtarget.getGRLen()))
9515 return false;
9516 return true;
9517}
9518
9519// memcpy and other memory intrinsics typically try to use wider loads/stores
9520// if the source/dest is aligned and the copy size is large enough. We therefore
9521// want to align such objects passed to memory intrinsics.
9523 unsigned &MinSize,
9524 Align &PrefAlign) const {
9525 if (!isa<MemIntrinsic>(CI))
9526 return false;
9527
9528 if (Subtarget.is64Bit()) {
9529 MinSize = 8;
9530 PrefAlign = Align(8);
9531 } else {
9532 MinSize = 4;
9533 PrefAlign = Align(4);
9534 }
9535
9536 return true;
9537}
9538
9547
9548bool LoongArchTargetLowering::splitValueIntoRegisterParts(
9549 SelectionDAG &DAG, const SDLoc &DL, SDValue Val, SDValue *Parts,
9550 unsigned NumParts, MVT PartVT, std::optional<CallingConv::ID> CC) const {
9551 bool IsABIRegCopy = CC.has_value();
9552 EVT ValueVT = Val.getValueType();
9553
9554 if (IsABIRegCopy && (ValueVT == MVT::f16 || ValueVT == MVT::bf16) &&
9555 PartVT == MVT::f32) {
9556 // Cast the [b]f16 to i16, extend to i32, pad with ones to make a float
9557 // NaN, and cast to f32.
9558 Val = DAG.getNode(ISD::BITCAST, DL, MVT::i16, Val);
9559 Val = DAG.getNode(ISD::ANY_EXTEND, DL, MVT::i32, Val);
9560 Val = DAG.getNode(ISD::OR, DL, MVT::i32, Val,
9561 DAG.getConstant(0xFFFF0000, DL, MVT::i32));
9562 Val = DAG.getNode(ISD::BITCAST, DL, MVT::f32, Val);
9563 Parts[0] = Val;
9564 return true;
9565 }
9566
9567 return false;
9568}
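Concretely (an illustrative sketch; the helper is made up): the half-precision value 1.0 has bit pattern 0x3C00, which after the extend-and-OR above becomes 0xFFFF3C00, a quiet f32 NaN whose low 16 bits carry the original f16 payload.

// Illustrative sketch only: the NaN-boxing pattern used above to carry an f16 or
// bf16 value in an f32 register.
static uint32_t exampleNaNBoxHalf(uint16_t HalfBits) {
  return 0xFFFF0000u | HalfBits; // half 1.0 (0x3C00) -> 0xFFFF3C00
}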
9569
9570SDValue LoongArchTargetLowering::joinRegisterPartsIntoValue(
9571 SelectionDAG &DAG, const SDLoc &DL, const SDValue *Parts, unsigned NumParts,
9572 MVT PartVT, EVT ValueVT, std::optional<CallingConv::ID> CC) const {
9573 bool IsABIRegCopy = CC.has_value();
9574
9575 if (IsABIRegCopy && (ValueVT == MVT::f16 || ValueVT == MVT::bf16) &&
9576 PartVT == MVT::f32) {
9577 SDValue Val = Parts[0];
9578
9579 // Cast the f32 to i32, truncate to i16, and cast back to [b]f16.
9580 Val = DAG.getNode(ISD::BITCAST, DL, MVT::i32, Val);
9581 Val = DAG.getNode(ISD::TRUNCATE, DL, MVT::i16, Val);
9582 Val = DAG.getNode(ISD::BITCAST, DL, ValueVT, Val);
9583 return Val;
9584 }
9585
9586 return SDValue();
9587}
9588
9589MVT LoongArchTargetLowering::getRegisterTypeForCallingConv(LLVMContext &Context,
9590 CallingConv::ID CC,
9591 EVT VT) const {
9592 // Use f32 to pass f16.
9593 if (VT == MVT::f16 && Subtarget.hasBasicF())
9594 return MVT::f32;
9595
9597}
9598
9599unsigned LoongArchTargetLowering::getNumRegistersForCallingConv(
9600 LLVMContext &Context, CallingConv::ID CC, EVT VT) const {
9601 // Use f32 to pass f16.
9602 if (VT == MVT::f16 && Subtarget.hasBasicF())
9603 return 1;
9604
9606}
9607
9609 SDValue Op, const APInt &OriginalDemandedBits,
9610 const APInt &OriginalDemandedElts, KnownBits &Known, TargetLoweringOpt &TLO,
9611 unsigned Depth) const {
9612 EVT VT = Op.getValueType();
9613 unsigned BitWidth = OriginalDemandedBits.getBitWidth();
9614 unsigned Opc = Op.getOpcode();
9615 switch (Opc) {
9616 default:
9617 break;
9620 SDValue Src = Op.getOperand(0);
9621 MVT SrcVT = Src.getSimpleValueType();
9622 unsigned SrcBits = SrcVT.getScalarSizeInBits();
9623 unsigned NumElts = SrcVT.getVectorNumElements();
9624
9625 // If we don't need the sign bits at all just return zero.
9626 if (OriginalDemandedBits.countr_zero() >= NumElts)
9627 return TLO.CombineTo(Op, TLO.DAG.getConstant(0, SDLoc(Op), VT));
9628
9629 // Only demand the vector elements of the sign bits we need.
9630 APInt KnownUndef, KnownZero;
9631 APInt DemandedElts = OriginalDemandedBits.zextOrTrunc(NumElts);
9632 if (SimplifyDemandedVectorElts(Src, DemandedElts, KnownUndef, KnownZero,
9633 TLO, Depth + 1))
9634 return true;
9635
9636 Known.Zero = KnownZero.zext(BitWidth);
9637 Known.Zero.setHighBits(BitWidth - NumElts);
9638
9639 // [X]VMSKLTZ only uses the MSB from each vector element.
9640 KnownBits KnownSrc;
9641 APInt DemandedSrcBits = APInt::getSignMask(SrcBits);
9642 if (SimplifyDemandedBits(Src, DemandedSrcBits, DemandedElts, KnownSrc, TLO,
9643 Depth + 1))
9644 return true;
9645
9646 if (KnownSrc.One[SrcBits - 1])
9647 Known.One.setLowBits(NumElts);
9648 else if (KnownSrc.Zero[SrcBits - 1])
9649 Known.Zero.setLowBits(NumElts);
9650
9651 // Attempt to avoid multi-use ops if we don't need anything from it.
9653 Src, DemandedSrcBits, DemandedElts, TLO.DAG, Depth + 1))
9654 return TLO.CombineTo(Op, TLO.DAG.getNode(Opc, SDLoc(Op), VT, NewSrc));
9655 return false;
9656 }
9657 }
9658
9660 Op, OriginalDemandedBits, OriginalDemandedElts, Known, TLO, Depth);
9661}
9662
9664 unsigned Opc = VecOp.getOpcode();
9665
9666 // Assume target opcodes can't be scalarized.
9667 // TODO - do we have any exceptions?
9668 if (Opc >= ISD::BUILTIN_OP_END || !isBinOp(Opc))
9669 return false;
9670
9671 // If the vector op is not supported, try to convert to scalar.
9672 EVT VecVT = VecOp.getValueType();
9674 return true;
9675
9676 // If the vector op is supported, but the scalar op is not, the transform may
9677 // not be worthwhile.
9678 EVT ScalarVT = VecVT.getScalarType();
9679 return isOperationLegalOrCustomOrPromote(Opc, ScalarVT);
9680}
9681
9683 unsigned Index) const {
9685 return false;
9686
9687 // Extracting a 128-bit subvector at index 0 of a 256-bit vector is free.
9688 return Index == 0;
9689}
9690
9692 unsigned Index) const {
9693 EVT EltVT = VT.getScalarType();
9694
9695 // Extracting a scalar FP value from index 0 of a vector is free.
9696 return (EltVT == MVT::f32 || EltVT == MVT::f64) && Index == 0;
9697}
unsigned const MachineRegisterInfo * MRI
static MCRegister MatchRegisterName(StringRef Name)
static bool checkValueWidth(SDValue V, unsigned width, ISD::LoadExtType &ExtType)
static SDValue performORCombine(SDNode *N, TargetLowering::DAGCombinerInfo &DCI, const AArch64Subtarget *Subtarget, const AArch64TargetLowering &TLI)
return SDValue()
static SDValue performANDCombine(SDNode *N, TargetLowering::DAGCombinerInfo &DCI)
static SDValue performSETCCCombine(SDNode *N, TargetLowering::DAGCombinerInfo &DCI, SelectionDAG &DAG)
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
static msgpack::DocNode getNode(msgpack::DocNode DN, msgpack::Type Type, MCValue Val)
#define NODE_NAME_CASE(node)
MachineBasicBlock & MBB
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
static MCRegister MatchRegisterAltName(StringRef Name)
Maps from the set of all alternative registernames to a register number.
Function Alias Analysis Results
static uint64_t getConstant(const Value *IndexValue)
static SDValue getTargetNode(ConstantPoolSDNode *N, const SDLoc &DL, EVT Ty, SelectionDAG &DAG, unsigned Flags)
static GCRegistry::Add< CoreCLRGC > E("coreclr", "CoreCLR-compatible GC")
static SDValue convertValVTToLocVT(SelectionDAG &DAG, SDValue Val, const CCValAssign &VA, const SDLoc &DL)
static SDValue unpackFromMemLoc(SelectionDAG &DAG, SDValue Chain, const CCValAssign &VA, const SDLoc &DL)
static SDValue convertLocVTToValVT(SelectionDAG &DAG, SDValue Val, const CCValAssign &VA, const SDLoc &DL)
static MachineBasicBlock * emitSelectPseudo(MachineInstr &MI, MachineBasicBlock *BB, unsigned Opcode)
static SDValue unpackFromRegLoc(const CSKYSubtarget &Subtarget, SelectionDAG &DAG, SDValue Chain, const CCValAssign &VA, const SDLoc &DL)
#define clEnumValN(ENUMVAL, FLAGNAME, DESC)
const HexagonInstrInfo * TII
IRTranslator LLVM IR MI
const size_t AbstractManglingParser< Derived, Alloc >::NumOps
const AbstractManglingParser< Derived, Alloc >::OperatorInfo AbstractManglingParser< Derived, Alloc >::Ops[]
#define RegName(no)
static SDValue performINTRINSIC_WO_CHAINCombine(SDNode *N, SelectionDAG &DAG, TargetLowering::DAGCombinerInfo &DCI, const LoongArchSubtarget &Subtarget)
const MCPhysReg ArgFPR32s[]
static SDValue lower128BitShuffle(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG, const LoongArchSubtarget &Subtarget)
Dispatching routine to lower various 128-bit LoongArch vector shuffles.
static SDValue lowerVECTOR_SHUFFLE_XVSHUF4I(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG, const LoongArchSubtarget &Subtarget)
Lower VECTOR_SHUFFLE into XVSHUF4I (if possible).
const MCPhysReg ArgVRs[]
static SDValue lowerVECTOR_SHUFFLE_VPICKEV(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG)
Lower VECTOR_SHUFFLE into VPICKEV (if possible).
static SDValue combineSelectToBinOp(SDNode *N, SelectionDAG &DAG, const LoongArchSubtarget &Subtarget)
static SDValue lowerVECTOR_SHUFFLE_XVPICKOD(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG)
Lower VECTOR_SHUFFLE into XVPICKOD (if possible).
static SDValue unpackF64OnLA32DSoftABI(SelectionDAG &DAG, SDValue Chain, const CCValAssign &VA, const CCValAssign &HiVA, const SDLoc &DL)
static bool fitsRegularPattern(typename SmallVectorImpl< ValType >::const_iterator Begin, unsigned CheckStride, typename SmallVectorImpl< ValType >::const_iterator End, ValType ExpectedIndex, unsigned ExpectedIndexStride)
Determine whether a range fits a regular pattern of values.
static SDValue lowerVECTOR_SHUFFLE_IsReverse(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SelectionDAG &DAG, const LoongArchSubtarget &Subtarget)
Lower VECTOR_SHUFFLE whose result is the reversed source vector.
static SDValue emitIntrinsicErrorMessage(SDValue Op, StringRef ErrorMsg, SelectionDAG &DAG)
static cl::opt< bool > ZeroDivCheck("loongarch-check-zero-division", cl::Hidden, cl::desc("Trap on integer division by zero."), cl::init(false))
static SDValue lowerVECTOR_SHUFFLE_VSHUF(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG, const LoongArchSubtarget &Subtarget)
Lower VECTOR_SHUFFLE into VSHUF.
static int getEstimateRefinementSteps(EVT VT, const LoongArchSubtarget &Subtarget)
static void emitErrorAndReplaceIntrinsicResults(SDNode *N, SmallVectorImpl< SDValue > &Results, SelectionDAG &DAG, StringRef ErrorMsg, bool WithChain=true)
static SDValue lowerVECTOR_SHUFFLEAsByteRotate(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG, const LoongArchSubtarget &Subtarget)
Lower VECTOR_SHUFFLE as byte rotate (if possible).
static SDValue checkIntrinsicImmArg(SDValue Op, unsigned ImmOp, SelectionDAG &DAG, bool IsSigned=false)
static SDValue lowerVECTOR_SHUFFLE_XVINSVE0(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG, const LoongArchSubtarget &Subtarget)
Lower VECTOR_SHUFFLE into XVINSVE0 (if possible).
static SDValue performMOVFR2GR_SCombine(SDNode *N, SelectionDAG &DAG, TargetLowering::DAGCombinerInfo &DCI, const LoongArchSubtarget &Subtarget)
static SDValue lowerVECTOR_SHUFFLE_VILVH(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG)
Lower VECTOR_SHUFFLE into VILVH (if possible).
static bool CC_LoongArch(const DataLayout &DL, LoongArchABI::ABI ABI, unsigned ValNo, MVT ValVT, CCValAssign::LocInfo LocInfo, ISD::ArgFlagsTy ArgFlags, CCState &State, bool IsRet, Type *OrigTy)
static Align getPrefTypeAlign(EVT VT, SelectionDAG &DAG)
static SDValue performSPLIT_PAIR_F64Combine(SDNode *N, SelectionDAG &DAG, TargetLowering::DAGCombinerInfo &DCI, const LoongArchSubtarget &Subtarget)
static SDValue performBITCASTCombine(SDNode *N, SelectionDAG &DAG, TargetLowering::DAGCombinerInfo &DCI, const LoongArchSubtarget &Subtarget)
static SDValue performSRLCombine(SDNode *N, SelectionDAG &DAG, TargetLowering::DAGCombinerInfo &DCI, const LoongArchSubtarget &Subtarget)
static MachineBasicBlock * emitSplitPairF64Pseudo(MachineInstr &MI, MachineBasicBlock *BB, const LoongArchSubtarget &Subtarget)
static SDValue lowerVectorBitSetImm(SDNode *Node, SelectionDAG &DAG)
static SDValue performSETCC_BITCASTCombine(SDNode *N, SelectionDAG &DAG, TargetLowering::DAGCombinerInfo &DCI, const LoongArchSubtarget &Subtarget)
@ NoMaterializeFPImm
@ MaterializeFPImm2Ins
@ MaterializeFPImm3Ins
@ MaterializeFPImm4Ins
@ MaterializeFPImm5Ins
@ MaterializeFPImm6Ins
static SDValue lowerVECTOR_SHUFFLE_XVPACKOD(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG)
Lower VECTOR_SHUFFLE into XVPACKOD (if possible).
static std::optional< bool > matchSetCC(SDValue LHS, SDValue RHS, ISD::CondCode CC, SDValue Val)
static SDValue lowerBUILD_VECTORAsBroadCastLoad(BuildVectorSDNode *BVOp, const SDLoc &DL, SelectionDAG &DAG)
#define CRC_CASE_EXT_BINARYOP(NAME, NODE)
static SDValue lowerVectorBitRevImm(SDNode *Node, SelectionDAG &DAG)
static bool checkBitcastSrcVectorSize(SDValue Src, unsigned Size, unsigned Depth)
static SDValue lowerVECTOR_SHUFFLEAsShift(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG, const LoongArchSubtarget &Subtarget, const APInt &Zeroable)
Lower VECTOR_SHUFFLE as shift (if possible).
static SDValue lowerVECTOR_SHUFFLE_VSHUF4I(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG, const LoongArchSubtarget &Subtarget)
Lower VECTOR_SHUFFLE into VSHUF4I (if possible).
static SDValue truncateVecElts(SDNode *Node, SelectionDAG &DAG)
static bool CC_LoongArch_GHC(unsigned ValNo, MVT ValVT, MVT LocVT, CCValAssign::LocInfo LocInfo, ISD::ArgFlagsTy ArgFlags, Type *OrigTy, CCState &State)
static MachineBasicBlock * insertDivByZeroTrap(MachineInstr &MI, MachineBasicBlock *MBB)
static SDValue customLegalizeToWOpWithSExt(SDNode *N, SelectionDAG &DAG)
static SDValue lowerVectorBitClear(SDNode *Node, SelectionDAG &DAG)
static SDValue lowerVECTOR_SHUFFLE_VPACKEV(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG)
Lower VECTOR_SHUFFLE into VPACKEV (if possible).
static MachineBasicBlock * emitPseudoVMSKCOND(MachineInstr &MI, MachineBasicBlock *BB, const LoongArchSubtarget &Subtarget)
static SDValue performSELECT_CCCombine(SDNode *N, SelectionDAG &DAG, TargetLowering::DAGCombinerInfo &DCI, const LoongArchSubtarget &Subtarget)
static void replaceVPICKVE2GRResults(SDNode *Node, SmallVectorImpl< SDValue > &Results, SelectionDAG &DAG, const LoongArchSubtarget &Subtarget, unsigned ResOp)
static SDValue lowerVECTOR_SHUFFLEAsZeroOrAnyExtend(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG, const APInt &Zeroable)
Lower VECTOR_SHUFFLE as ZERO_EXTEND or ANY_EXTEND (if possible).
static SDValue legalizeIntrinsicImmArg(SDNode *Node, unsigned ImmOp, SelectionDAG &DAG, const LoongArchSubtarget &Subtarget, bool IsSigned=false)
static cl::opt< MaterializeFPImm > MaterializeFPImmInsNum("loongarch-materialize-float-imm", cl::Hidden, cl::desc("Maximum number of instructions used (including code sequence " "to generate the value and moving the value to FPR) when " "materializing floating-point immediates (default = 3)"), cl::init(MaterializeFPImm3Ins), cl::values(clEnumValN(NoMaterializeFPImm, "0", "Use constant pool"), clEnumValN(MaterializeFPImm2Ins, "2", "Materialize FP immediate within 2 instructions"), clEnumValN(MaterializeFPImm3Ins, "3", "Materialize FP immediate within 3 instructions"), clEnumValN(MaterializeFPImm4Ins, "4", "Materialize FP immediate within 4 instructions"), clEnumValN(MaterializeFPImm5Ins, "5", "Materialize FP immediate within 5 instructions"), clEnumValN(MaterializeFPImm6Ins, "6", "Materialize FP immediate within 6 instructions " "(behaves same as 5 on loongarch64)")))
static SDValue lowerVECTOR_SHUFFLE_XVPERMI(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SelectionDAG &DAG, const LoongArchSubtarget &Subtarget)
Lower VECTOR_SHUFFLE into XVPERMI (if possible).
static SDValue emitIntrinsicWithChainErrorMessage(SDValue Op, StringRef ErrorMsg, SelectionDAG &DAG)
const MCPhysReg ArgXRs[]
static bool CC_LoongArchAssign2GRLen(unsigned GRLen, CCState &State, CCValAssign VA1, ISD::ArgFlagsTy ArgFlags1, unsigned ValNo2, MVT ValVT2, MVT LocVT2, ISD::ArgFlagsTy ArgFlags2)
const MCPhysReg ArgFPR64s[]
static MachineBasicBlock * emitPseudoCTPOP(MachineInstr &MI, MachineBasicBlock *BB, const LoongArchSubtarget &Subtarget)
static SDValue performMOVGR2FR_WCombine(SDNode *N, SelectionDAG &DAG, TargetLowering::DAGCombinerInfo &DCI, const LoongArchSubtarget &Subtarget)
#define IOCSRWR_CASE(NAME, NODE)
#define CRC_CASE_EXT_UNARYOP(NAME, NODE)
static SDValue lowerVECTOR_SHUFFLE_VPACKOD(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG)
Lower VECTOR_SHUFFLE into VPACKOD (if possible).
static SDValue signExtendBitcastSrcVector(SelectionDAG &DAG, EVT SExtVT, SDValue Src, const SDLoc &DL)
static SDValue lower256BitShuffle(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG, const LoongArchSubtarget &Subtarget)
Dispatching routine to lower various 256-bit LoongArch vector shuffles.
static SDValue lowerVECTOR_SHUFFLE_VREPLVEI(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SelectionDAG &DAG, const LoongArchSubtarget &Subtarget)
Lower VECTOR_SHUFFLE into VREPLVEI (if possible).
static MachineBasicBlock * emitPseudoXVINSGR2VR(MachineInstr &MI, MachineBasicBlock *BB, const LoongArchSubtarget &Subtarget)
static void fillVector(ArrayRef< SDValue > Ops, SelectionDAG &DAG, SDLoc DL, const LoongArchSubtarget &Subtarget, SDValue &Vector, EVT ResTy)
static SDValue performEXTRACT_VECTOR_ELTCombine(SDNode *N, SelectionDAG &DAG, TargetLowering::DAGCombinerInfo &DCI, const LoongArchSubtarget &Subtarget)
static SDValue fillSubVectorFromBuildVector(BuildVectorSDNode *Node, SelectionDAG &DAG, SDLoc DL, const LoongArchSubtarget &Subtarget, EVT ResTy, unsigned first)
static bool isSelectPseudo(MachineInstr &MI)
static SDValue foldBinOpIntoSelectIfProfitable(SDNode *BO, SelectionDAG &DAG, const LoongArchSubtarget &Subtarget)
static SDValue lowerVectorSplatImm(SDNode *Node, unsigned ImmOp, SelectionDAG &DAG, bool IsSigned=false)
const MCPhysReg ArgGPRs[]
static SDValue lowerVECTOR_SHUFFLE_XVPERM(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SelectionDAG &DAG, const LoongArchSubtarget &Subtarget)
Lower VECTOR_SHUFFLE into XVPERM (if possible).
static SDValue lowerVECTOR_SHUFFLE_XVILVL(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG)
Lower VECTOR_SHUFFLE into XVILVL (if possible).
static SDValue customLegalizeToWOp(SDNode *N, SelectionDAG &DAG, int NumOp, unsigned ExtOpc=ISD::ANY_EXTEND)
static void replaceVecCondBranchResults(SDNode *N, SmallVectorImpl< SDValue > &Results, SelectionDAG &DAG, const LoongArchSubtarget &Subtarget, unsigned ResOp)
#define ASRT_LE_GT_CASE(NAME)
static SDValue lowerVECTOR_SHUFFLE_XVPACKEV(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG)
Lower VECTOR_SHUFFLE into XVPACKEV (if possible).
static SDValue performBR_CCCombine(SDNode *N, SelectionDAG &DAG, TargetLowering::DAGCombinerInfo &DCI, const LoongArchSubtarget &Subtarget)
static void computeZeroableShuffleElements(ArrayRef< int > Mask, SDValue V1, SDValue V2, APInt &KnownUndef, APInt &KnownZero)
Compute whether each element of a shuffle is zeroable.
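As a rough illustration of the idea (the in-tree routine inspects the actual SDValue operands and BUILD_VECTOR constants), an element of the shuffle result is "zeroable" when it is undef or selects a lane known to be zero in its source. The per-lane flag modelling and the helper name below are ours.

#include <vector>

// Sketch: Mask entries < N select from V1, entries >= N select from V2,
// and -1 means undef. Sources are modelled as per-lane "known zero" flags.
static void computeZeroableSketch(const std::vector<int> &Mask,
                                  const std::vector<bool> &V1Zero,
                                  const std::vector<bool> &V2Zero,
                                  std::vector<bool> &Zeroable) {
  const int N = (int)Mask.size();
  Zeroable.assign(N, false);
  for (int I = 0; I < N; ++I) {
    int M = Mask[I];
    if (M < 0)
      Zeroable[I] = true;               // undef lanes may take any value
    else if (M < N)
      Zeroable[I] = V1Zero[M];          // lane comes from V1
    else
      Zeroable[I] = V2Zero[M - N];      // lane comes from V2
  }
}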
static bool combine_CC(SDValue &LHS, SDValue &RHS, SDValue &CC, const SDLoc &DL, SelectionDAG &DAG, const LoongArchSubtarget &Subtarget)
static SDValue widenShuffleMask(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG)
static MachineBasicBlock * emitVecCondBranchPseudo(MachineInstr &MI, MachineBasicBlock *BB, const LoongArchSubtarget &Subtarget)
static bool canonicalizeShuffleVectorByLane(const SDLoc &DL, MutableArrayRef< int > Mask, MVT VT, SDValue &V1, SDValue &V2, SelectionDAG &DAG, const LoongArchSubtarget &Subtarget)
Shuffle vectors by lane to generate more optimized instructions.
static SDValue lowerVECTOR_SHUFFLE_XVILVH(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG)
Lower VECTOR_SHUFFLE into XVILVH (if possible).
static SDValue lowerVECTOR_SHUFFLE_XVSHUF(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG)
Lower VECTOR_SHUFFLE into XVSHUF (if possible).
static void replaceCMP_XCHG_128Results(SDNode *N, SmallVectorImpl< SDValue > &Results, SelectionDAG &DAG)
static SDValue lowerVectorPickVE2GR(SDNode *N, SelectionDAG &DAG, unsigned ResOp)
static SDValue performBITREV_WCombine(SDNode *N, SelectionDAG &DAG, TargetLowering::DAGCombinerInfo &DCI, const LoongArchSubtarget &Subtarget)
#define IOCSRRD_CASE(NAME, NODE)
static int matchShuffleAsByteRotate(MVT VT, SDValue &V1, SDValue &V2, ArrayRef< int > Mask)
Attempts to match vector shuffle as byte rotation.
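A minimal sketch of the single-input case follows (the in-tree matcher is more general and also handles rotates whose elements span both V1 and V2); the helper name and the example mask are ours.

#include <vector>

// Sketch: a mask rotates its single input by R elements when every non-undef
// entry satisfies Mask[I] == (I + R) % N. Returns the rotation, or -1.
static int matchRotateSketch(const std::vector<int> &Mask) {
  const int N = (int)Mask.size();
  for (int R = 0; R < N; ++R) {
    bool Matches = true;
    for (int I = 0; I < N && Matches; ++I)
      Matches = Mask[I] == -1 || Mask[I] == (I + R) % N;
    if (Matches)
      return R;
  }
  return -1;
}
// e.g. {1, 2, 3, 0} on a 4-element vector is a rotate by one element.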
static SDValue lowerVECTOR_SHUFFLE_XVPICKEV(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG)
Lower VECTOR_SHUFFLE into XVPICKEV (if possible).
static SDValue lowerVECTOR_SHUFFLE_XVREPLVEI(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SelectionDAG &DAG, const LoongArchSubtarget &Subtarget)
Lower VECTOR_SHUFFLE into XVREPLVEI (if possible).
static int matchShuffleAsShift(MVT &ShiftVT, unsigned &Opcode, unsigned ScalarSizeInBits, ArrayRef< int > Mask, int MaskOffset, const APInt &Zeroable)
Attempts to match a shuffle mask against the VBSLL, VBSRL, VSLLI and VSRLI instructions.
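A hedged sketch of the left-shift half of this check (names ours): lanes below the shift amount must be zeroable, and the remaining lanes must be a sequential copy from the source.

#include <vector>

// Sketch: the mask describes "shift left by S elements" when lane I < S is
// zeroable (fed by zeros or undef) and lane I >= S selects source lane I - S.
static bool matchShiftLeftSketch(const std::vector<int> &Mask,
                                 const std::vector<bool> &Zeroable, int S) {
  const int N = (int)Mask.size();
  for (int I = 0; I < N; ++I) {
    if (I < S) {
      if (!Zeroable[I])
        return false;
    } else if (Mask[I] != -1 && Mask[I] != I - S) {
      return false;
    }
  }
  return true;
}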
static SDValue lowerVECTOR_SHUFFLE_VILVL(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG)
Lower VECTOR_SHUFFLE into VILVL (if possible).
static SDValue lowerVectorBitClearImm(SDNode *Node, SelectionDAG &DAG)
static MachineBasicBlock * emitBuildPairF64Pseudo(MachineInstr &MI, MachineBasicBlock *BB, const LoongArchSubtarget &Subtarget)
static SDValue lowerVECTOR_SHUFFLEAsLanePermuteAndShuffle(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG)
Lower VECTOR_SHUFFLE as lane permute and then shuffle (if possible).
static SDValue performVMSKLTZCombine(SDNode *N, SelectionDAG &DAG, TargetLowering::DAGCombinerInfo &DCI, const LoongArchSubtarget &Subtarget)
static void replaceINTRINSIC_WO_CHAINResults(SDNode *N, SmallVectorImpl< SDValue > &Results, SelectionDAG &DAG, const LoongArchSubtarget &Subtarget)
#define CSR_CASE(ID)
static SDValue lowerVECTOR_SHUFFLE_VPICKOD(const SDLoc &DL, ArrayRef< int > Mask, MVT VT, SDValue V1, SDValue V2, SelectionDAG &DAG)
Lower VECTOR_SHUFFLE into VPICKOD (if possible).
static Intrinsic::ID getIntrinsicForMaskedAtomicRMWBinOp(unsigned GRLen, AtomicRMWInst::BinOp BinOp)
static void translateSetCCForBranch(const SDLoc &DL, SDValue &LHS, SDValue &RHS, ISD::CondCode &CC, SelectionDAG &DAG)
static bool isRepeatedShuffleMask(unsigned LaneSizeInBits, MVT VT, ArrayRef< int > Mask, SmallVectorImpl< int > &RepeatedMask)
Test whether a shuffle mask is equivalent within each sub-lane.
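To make "equivalent within each sub-lane" concrete, here is a simplified single-source sketch (the in-tree helper also tracks which source vector each repeated element comes from); the names and the example are ours.

#include <vector>

// Sketch: with LaneElts elements per lane, every lane must apply the same
// within-lane permutation. For v8i32 split into two 128-bit lanes,
// {1,0,3,2, 5,4,7,6} repeats the per-lane pattern {1,0,3,2}.
static bool isRepeatedMaskSketch(const std::vector<int> &Mask, int LaneElts,
                                 std::vector<int> &Repeated) {
  Repeated.assign(LaneElts, -1);
  const int N = (int)Mask.size();
  for (int I = 0; I < N; ++I) {
    if (Mask[I] < 0)
      continue;
    int Lane = I / LaneElts;
    int Local = Mask[I] - Lane * LaneElts;   // index relative to this lane
    if (Local < 0 || Local >= LaneElts)
      return false;                          // element crosses a lane boundary
    int &Slot = Repeated[I % LaneElts];
    if (Slot >= 0 && Slot != Local)
      return false;                          // lanes disagree on this slot
    Slot = Local;
  }
  return true;
}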
static LoongArchISD::NodeType getLoongArchWOpcode(unsigned Opcode)
This file defines the SmallSet class.
This file defines the 'Statistic' class, which is designed to be an easy way to expose various metric...
#define STATISTIC(VARNAME, DESC)
Definition Statistic.h:171
This file contains some functions that are useful when dealing with strings.
#define LLVM_DEBUG(...)
Definition Debug.h:114
static bool isSequentialOrUndefInRange(ArrayRef< int > Mask, unsigned Pos, unsigned Size, int Low, int Step=1)
Return true if every element in Mask, beginning from position Pos and ending in Pos + Size,...
bool isExactlyValue(double V) const
We don't rely on operator== working on double values, as it returns true for things that are clearly ...
Definition APFloat.h:1414
bool isZero() const
Definition APFloat.h:1427
APInt bitcastToAPInt() const
Definition APFloat.h:1335
Class for arbitrary precision integers.
Definition APInt.h:78
static APInt getAllOnes(unsigned numBits)
Return an APInt of a specified width with all bits set.
Definition APInt.h:235
LLVM_ABI APInt zext(unsigned width) const
Zero extend to a new width.
Definition APInt.cpp:1012
static APInt getSignMask(unsigned BitWidth)
Get the SignMask for a specific bit width.
Definition APInt.h:230
uint64_t getZExtValue() const
Get zero extended value.
Definition APInt.h:1541
void setHighBits(unsigned hiBits)
Set the top hiBits bits.
Definition APInt.h:1392
LLVM_ABI APInt zextOrTrunc(unsigned width) const
Zero extend or truncate to width.
Definition APInt.cpp:1033
LLVM_ABI APInt trunc(unsigned width) const
Truncate to new width.
Definition APInt.cpp:936
void setBit(unsigned BitPosition)
Set the given bit to 1 whose position is given as "bitPosition".
Definition APInt.h:1331
bool isAllOnes() const
Determine if all bits are set. This is true for zero-width values.
Definition APInt.h:372
bool isZero() const
Determine if this value is zero, i.e. all bits are clear.
Definition APInt.h:381
unsigned getBitWidth() const
Return the number of bits in the APInt.
Definition APInt.h:1489
unsigned countr_zero() const
Count the number of trailing zero bits.
Definition APInt.h:1640
bool isSignedIntN(unsigned N) const
Check if this APInt has an N-bits signed integer value.
Definition APInt.h:436
bool isSubsetOf(const APInt &RHS) const
This operation checks that all bits set in this APInt are also set in RHS.
Definition APInt.h:1258
static APInt getZero(unsigned numBits)
Get the '0' value for the specified bit-width.
Definition APInt.h:201
void setLowBits(unsigned loBits)
Set the bottom loBits bits.
Definition APInt.h:1389
static APInt getBitsSetFrom(unsigned numBits, unsigned loBit)
Constructs an APInt value that has a contiguous range of bits set.
Definition APInt.h:287
int64_t getSExtValue() const
Get sign extended value.
Definition APInt.h:1563
APInt lshr(unsigned shiftAmt) const
Logical right-shift function.
Definition APInt.h:852
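The APInt members listed above are easiest to read with a small usage sketch; the operations are the upstream APInt API as documented here, and only the scenario is invented.

#include "llvm/ADT/APInt.h"
#include <cassert>
using namespace llvm;

int main() {
  APInt Splat = APInt::getAllOnes(16);   // i16 0xFFFF
  assert(Splat.isAllOnes() && Splat.getBitWidth() == 16);

  APInt Wide = Splat.zext(32);           // zero-extend: i32 0x0000FFFF
  assert(Wide.getZExtValue() == 0xFFFFu && Wide.countr_zero() == 0);

  APInt Bit = APInt::getZero(32);
  Bit.setBit(12);                        // i32 0x1000
  assert(Bit.lshr(12).getZExtValue() == 1);

  APInt Narrow = Wide.trunc(8);          // keep the low 8 bits: i8 0xFF
  assert(Narrow.isAllOnes());
  return 0;
}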
This class represents an incoming formal argument to a Function.
Definition Argument.h:32
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition ArrayRef.h:41
size_t size() const
size - Get the array size.
Definition ArrayRef.h:143
An instruction that atomically checks whether a specified value is in a memory location,...
AtomicOrdering getFailureOrdering() const
Returns the failure ordering constraint of this cmpxchg instruction.
an instruction that atomically reads a memory location, combines it with another value,...
Align getAlign() const
Return the alignment of the memory that is being allocated by the instruction.
BinOp
This enumeration lists the possible modifications atomicrmw can make.
@ Add
*p = old + v
@ USubCond
Subtract only if no unsigned overflow.
@ Min
*p = old <signed v ? old : v
@ Sub
*p = old - v
@ And
*p = old & v
@ Xor
*p = old ^ v
@ USubSat
*p = usub.sat(old, v) usub.sat matches the behavior of llvm.usub.sat.
@ UIncWrap
Increment one up to a maximum value.
@ Max
*p = old >signed v ? old : v
@ UMin
*p = old <unsigned v ? old : v
@ UMax
*p = old >unsigned v ? old : v
@ UDecWrap
Decrement one until a minimum value or zero.
@ Nand
*p = ~(old & v)
Value * getPointerOperand()
bool isFloatingPointOperation() const
BinOp getOperation() const
SyncScope::ID getSyncScopeID() const
Returns the synchronization scope ID of this rmw instruction.
AtomicOrdering getOrdering() const
Returns the ordering constraint of this rmw instruction.
LLVM Basic Block Representation.
Definition BasicBlock.h:62
bool test(unsigned Idx) const
Definition BitVector.h:480
size_type count() const
count - Returns the number of bits which are set.
Definition BitVector.h:181
A "pseudo-class" with methods for operating on BUILD_VECTORs.
CCState - This class holds information needed while lowering arguments and return values.
unsigned getFirstUnallocated(ArrayRef< MCPhysReg > Regs) const
getFirstUnallocated - Return the index of the first unallocated register in the set,...
LLVM_ABI void AnalyzeCallOperands(const SmallVectorImpl< ISD::OutputArg > &Outs, CCAssignFn Fn)
AnalyzeCallOperands - Analyze the outgoing arguments to a call, incorporating info about the passed v...
uint64_t getStackSize() const
Returns the size of the currently allocated portion of the stack.
LLVM_ABI void AnalyzeFormalArguments(const SmallVectorImpl< ISD::InputArg > &Ins, CCAssignFn Fn)
AnalyzeFormalArguments - Analyze an array of argument values, incorporating info about the formals in...
CCValAssign - Represent assignment of one arg/retval to a location.
static CCValAssign getPending(unsigned ValNo, MVT ValVT, MVT LocVT, LocInfo HTP, unsigned ExtraInfo=0)
Register getLocReg() const
LocInfo getLocInfo() const
static CCValAssign getReg(unsigned ValNo, MVT ValVT, MCRegister Reg, MVT LocVT, LocInfo HTP, bool IsCustom=false)
static CCValAssign getCustomReg(unsigned ValNo, MVT ValVT, MCRegister Reg, MVT LocVT, LocInfo HTP)
static CCValAssign getMem(unsigned ValNo, MVT ValVT, int64_t Offset, MVT LocVT, LocInfo HTP, bool IsCustom=false)
bool needsCustom() const
int64_t getLocMemOffset() const
unsigned getValNo() const
static CCValAssign getCustomMem(unsigned ValNo, MVT ValVT, int64_t Offset, MVT LocVT, LocInfo HTP)
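A hedged sketch of the usual CCState/CCValAssign flow that the calling-convention helpers above support; the wrapper name and its parameters are invented for illustration, and the real call sites are the LowerFormalArguments/LowerCall hooks documented on this page.

#include "llvm/CodeGen/CallingConvLower.h"
using namespace llvm;

static void walkArgAssignments(MachineFunction &MF, CallingConv::ID CC,
                               bool IsVarArg,
                               const SmallVectorImpl<ISD::InputArg> &Ins,
                               CCAssignFn Fn, LLVMContext &Ctx) {
  SmallVector<CCValAssign, 16> ArgLocs;
  CCState CCInfo(CC, IsVarArg, MF, ArgLocs, Ctx);
  CCInfo.AnalyzeFormalArguments(Ins, Fn);  // assign each arg a reg or a slot
  for (const CCValAssign &VA : ArgLocs) {
    if (VA.isRegLoc())
      (void)VA.getLocReg();                // value arrives in this register
    else
      (void)VA.getLocMemOffset();          // value arrives at this stack offset
  }
}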
LLVM_ABI bool isMustTailCall() const
Tests if this call site must be tail call optimized.
This class represents a function call, abstracting a target machine's calling convention.
bool isTailCall() const
const APFloat & getValueAPF() const
This is the shared class of boolean and integer constants.
Definition Constants.h:87
bool isMinusOne() const
This function will return true iff every bit in this constant is set to true.
Definition Constants.h:226
bool isZero() const
This is just a convenience method to make client code smaller for a common case.
Definition Constants.h:214
uint64_t getZExtValue() const
int64_t getSExtValue() const
This is an important base class in LLVM.
Definition Constant.h:43
A parsed version of the target data layout string in and methods for querying it.
Definition DataLayout.h:63
unsigned getPointerSizeInBits(unsigned AS=0) const
The size in bits of the pointer representation in a given address space.
Definition DataLayout.h:479
LLVM_ABI Align getPrefTypeAlign(Type *Ty) const
Returns the preferred stack/global alignment for the specified type.
A debug info location.
Definition DebugLoc.h:124
FunctionType * getFunctionType() const
Returns the FunctionType for me.
Definition Function.h:209
CallingConv::ID getCallingConv() const
getCallingConv()/setCallingConv(CC) - These method get and set the calling convention of this functio...
Definition Function.h:270
Argument * getArg(unsigned i) const
Definition Function.h:884
bool isDSOLocal() const
Common base class shared among various IRBuilders.
Definition IRBuilder.h:114
This provides a uniform API for creating instructions and inserting them into a basic block: either a...
Definition IRBuilder.h:2788
LLVM_ABI const Module * getModule() const
Return the module owning the function this instruction belongs to, or nullptr if the function does not...
LLVM_ABI InstListType::iterator eraseFromParent()
This method unlinks 'this' from the containing basic block and deletes it.
LLVM_ABI const DataLayout & getDataLayout() const
Get the data layout of the module this instruction belongs to.
Class to represent integer types.
This is an important class for using LLVM in a threaded context.
Definition LLVMContext.h:68
LLVM_ABI void emitError(const Instruction *I, const Twine &ErrorStr)
emitError - Emit an error message to the currently installed error handler with optional location inf...
This class is used to represent ISD::LOAD nodes.
ISD::LoadExtType getExtensionType() const
Return whether this is a plain node, or one of the varieties of value-extending loads.
LoongArchMachineFunctionInfo - This class is derived from MachineFunctionInfo and contains private Lo...
const LoongArchRegisterInfo * getRegisterInfo() const override
const LoongArchInstrInfo * getInstrInfo() const override
bool isUsedByReturnOnly(SDNode *N, SDValue &Chain) const override
Return true if result of the specified node is used by a return node only.
SDValue PerformDAGCombine(SDNode *N, DAGCombinerInfo &DCI) const override
This method will be invoked for all target nodes and for any target-independent nodes that the target...
SDValue getSqrtEstimate(SDValue Operand, SelectionDAG &DAG, int Enabled, int &RefinementSteps, bool &UseOneConstNR, bool Reciprocal) const override
Hooks for building estimates in place of slower divisions and square roots.
bool isLegalICmpImmediate(int64_t Imm) const override
Return true if the specified immediate is legal icmp immediate, that is the target has icmp instructi...
TargetLowering::AtomicExpansionKind shouldExpandAtomicCmpXchgInIR(AtomicCmpXchgInst *CI) const override
Returns how the given atomic cmpxchg should be expanded by the IR-level AtomicExpand pass.
Value * emitMaskedAtomicCmpXchgIntrinsic(IRBuilderBase &Builder, AtomicCmpXchgInst *CI, Value *AlignedAddr, Value *CmpVal, Value *NewVal, Value *Mask, AtomicOrdering Ord) const override
Perform a masked cmpxchg using a target-specific intrinsic.
EVT getSetCCResultType(const DataLayout &DL, LLVMContext &Context, EVT VT) const override
Return the ValueType of the result of SETCC operations.
std::pair< bool, uint64_t > isImmVLDILegalForMode1(const APInt &SplatValue, const unsigned SplatBitSize) const
Check if a constant splat can be generated using [x]vldi, where imm[12] is 1.
bool isFMAFasterThanFMulAndFAdd(const MachineFunction &MF, EVT VT) const override
Return true if an FMA operation is faster than a pair of fmul and fadd instructions.
SDValue LowerCall(TargetLowering::CallLoweringInfo &CLI, SmallVectorImpl< SDValue > &InVals) const override
This hook must be implemented to lower calls into the specified DAG.
bool decomposeMulByConstant(LLVMContext &Context, EVT VT, SDValue C) const override
Return true if it is profitable to transform an integer multiplication-by-constant into simpler opera...
bool isExtractVecEltCheap(EVT VT, unsigned Index) const override
Return true if extraction of a scalar element from the given vector type at the given index is cheap.
LegalizeTypeAction getPreferredVectorAction(MVT VT) const override
Return the preferred vector type legalization action.
bool isSExtCheaperThanZExt(EVT SrcVT, EVT DstVT) const override
Return true if sign-extension from FromTy to ToTy is cheaper than zero-extension.
TargetLowering::AtomicExpansionKind shouldExpandAtomicRMWInIR(AtomicRMWInst *AI) const override
Returns how the IR-level AtomicExpand pass should expand the given AtomicRMW, if at all.
bool allowsMisalignedMemoryAccesses(EVT VT, unsigned AddrSpace=0, Align Alignment=Align(1), MachineMemOperand::Flags Flags=MachineMemOperand::MONone, unsigned *Fast=nullptr) const override
Determine if the target supports unaligned memory accesses.
bool isCheapToSpeculateCtlz(Type *Ty) const override
Return true if it is cheap to speculate a call to intrinsic ctlz.
SDValue LowerOperation(SDValue Op, SelectionDAG &DAG) const override
This callback is invoked for operations that are unsupported by the target, which are registered to u...
bool shouldAlignPointerArgs(CallInst *CI, unsigned &MinSize, Align &PrefAlign) const override
Return true if the pointer arguments to CI should be aligned by aligning the object whose address is ...
Value * emitMaskedAtomicRMWIntrinsic(IRBuilderBase &Builder, AtomicRMWInst *AI, Value *AlignedAddr, Value *Incr, Value *Mask, Value *ShiftAmt, AtomicOrdering Ord) const override
Perform a masked atomicrmw using a target-specific intrinsic.
bool isExtractSubvectorCheap(EVT ResVT, EVT SrcVT, unsigned Index) const override
Return true if EXTRACT_SUBVECTOR is cheap for extracting this result type from this source type with ...
bool isZExtFree(SDValue Val, EVT VT2) const override
Return true if zero-extending the specific node Val to type VT2 is free (either because it's implicit...
Register getExceptionPointerRegister(const Constant *PersonalityFn) const override
If a physical register, this returns the register that receives the exception address on entry to an ...
bool signExtendConstant(const ConstantInt *CI) const override
Return true if this constant should be sign extended when promoting to a larger type.
const char * getTargetNodeName(unsigned Opcode) const override
This method returns the name of a target specific DAG node.
bool getTgtMemIntrinsic(IntrinsicInfo &Info, const CallInst &I, MachineFunction &MF, unsigned Intrinsic) const override
Given an intrinsic, checks if on the target the intrinsic will need to map to a MemIntrinsicNode (tou...
bool isLegalAddImmediate(int64_t Imm) const override
Return true if the specified immediate is legal add immediate, that is the target has add instruction...
bool isCheapToSpeculateCttz(Type *Ty) const override
Return true if it is cheap to speculate a call to intrinsic cttz.
bool isLegalAddressingMode(const DataLayout &DL, const AddrMode &AM, Type *Ty, unsigned AS, Instruction *I=nullptr) const override
Return true if the addressing mode represented by AM is legal for this target, for a load/store of th...
bool shouldSignExtendTypeInLibCall(Type *Ty, bool IsSigned) const override
Returns true if arguments should be sign-extended in lib calls.
bool shouldScalarizeBinop(SDValue VecOp) const override
Try to convert an extract element of a vector binary operation into an extract element followed by a ...
bool isFPImmVLDILegal(const APFloat &Imm, EVT VT) const
bool shouldExtendTypeInLibCall(EVT Type) const override
Returns true if arguments should be extended in lib calls.
Register getRegisterByName(const char *RegName, LLT VT, const MachineFunction &MF) const override
Return the register ID of the name passed in.
bool hasAndNot(SDValue Y) const override
Return true if the target has a bitwise and-not operation: X = ~A & B This can be used to simplify se...
bool isOffsetFoldingLegal(const GlobalAddressSDNode *GA) const override
Return true if folding a constant offset with the given GlobalAddress is legal.
Register getExceptionSelectorRegister(const Constant *PersonalityFn) const override
If a physical register, this returns the register that receives the exception typeid on entry to a la...
void ReplaceNodeResults(SDNode *N, SmallVectorImpl< SDValue > &Results, SelectionDAG &DAG) const override
This callback is invoked when a node result type is illegal for the target, and the operation was reg...
bool SimplifyDemandedBitsForTargetNode(SDValue Op, const APInt &DemandedBits, const APInt &DemandedElts, KnownBits &Known, TargetLoweringOpt &TLO, unsigned Depth) const override
Attempt to simplify any target nodes based on the demanded bits/elts, returning true on success.
void emitExpandAtomicRMW(AtomicRMWInst *AI) const override
Perform a atomicrmw expansion using a target-specific way.
ISD::NodeType getExtendForAtomicCmpSwapArg() const override
Returns how the platform's atomic compare and swap expects its comparison value to be extended (ZERO_...
LoongArchTargetLowering(const TargetMachine &TM, const LoongArchSubtarget &STI)
SDValue LowerReturn(SDValue Chain, CallingConv::ID CallConv, bool IsVarArg, const SmallVectorImpl< ISD::OutputArg > &Outs, const SmallVectorImpl< SDValue > &OutVals, const SDLoc &DL, SelectionDAG &DAG) const override
This hook must be implemented to lower outgoing return values, described by the Outs array,...
bool hasAndNotCompare(SDValue Y) const override
Return true if the target should transform: (X & Y) == Y ---> (~X & Y) == 0 (X & Y) !...
SDValue getRecipEstimate(SDValue Operand, SelectionDAG &DAG, int Enabled, int &RefinementSteps) const override
Return a reciprocal estimate value for the input operand.
bool CanLowerReturn(CallingConv::ID CallConv, MachineFunction &MF, bool IsVarArg, const SmallVectorImpl< ISD::OutputArg > &Outs, LLVMContext &Context, const Type *RetTy) const override
This hook should be implemented to check whether the return values described by the Outs array can fi...
SDValue LowerFormalArguments(SDValue Chain, CallingConv::ID CallConv, bool IsVarArg, const SmallVectorImpl< ISD::InputArg > &Ins, const SDLoc &DL, SelectionDAG &DAG, SmallVectorImpl< SDValue > &InVals) const override
This hook must be implemented to lower the incoming (formal) arguments, described by the Ins array,...
bool mayBeEmittedAsTailCall(const CallInst *CI) const override
Return true if the target may be able emit the call instruction as a tail call.
Wrapper class representing physical registers. Should be passed by value.
Definition MCRegister.h:33
bool hasFeature(unsigned Feature) const
Machine Value Type.
static MVT getFloatingPointVT(unsigned BitWidth)
bool is128BitVector() const
Return true if this is a 128-bit vector type.
SimpleValueType SimpleTy
uint64_t getScalarSizeInBits() const
unsigned getVectorNumElements() const
bool isVector() const
Return true if this is a vector value type.
bool isScalableVector() const
Return true if this is a vector value type where the runtime length is machine dependent.
TypeSize getSizeInBits() const
Returns the size of the specified MVT in bits.
static auto fixedlen_vector_valuetypes()
bool is256BitVector() const
Return true if this is a 256-bit vector type.
bool isScalarInteger() const
Return true if this is an integer, not including vectors.
static MVT getVectorVT(MVT VT, unsigned NumElements)
MVT getVectorElementType() const
bool isFloatingPoint() const
Return true if this is a FP or a vector FP type.
static MVT getIntegerVT(unsigned BitWidth)
MVT getHalfNumVectorElementsVT() const
Return a VT for a vector type with the same element type but half the number of elements.
MVT changeVectorElementTypeToInteger() const
Return a vector with the same number of elements as this vector, but with the element type converted ...
LLVM_ABI void transferSuccessorsAndUpdatePHIs(MachineBasicBlock *FromMBB)
Transfers all the successors, as in transferSuccessors, and update PHI operands in the successor bloc...
void push_back(MachineInstr *MI)
void setCallFrameSize(unsigned N)
Set the call frame size on entry to this basic block.
const BasicBlock * getBasicBlock() const
Return the LLVM basic block that this instance corresponded to originally.
LLVM_ABI void addSuccessor(MachineBasicBlock *Succ, BranchProbability Prob=BranchProbability::getUnknown())
Add Succ as a successor of this MachineBasicBlock.
const MachineFunction * getParent() const
Return the MachineFunction containing this basic block.
void splice(iterator Where, MachineBasicBlock *Other, iterator From)
Take an instruction from MBB 'Other' at the position From, and insert it into this MBB right before '...
MachineInstrBundleIterator< MachineInstr > iterator
The MachineFrameInfo class represents an abstract stack frame until prolog/epilog code is inserted.
LLVM_ABI int CreateFixedObject(uint64_t Size, int64_t SPOffset, bool IsImmutable, bool isAliased=false)
Create a new object at a fixed location on the stack.
LLVM_ABI int CreateStackObject(uint64_t Size, Align Alignment, bool isSpillSlot, const AllocaInst *Alloca=nullptr, uint8_t ID=0)
Create a new statically sized stack object, returning a nonnegative identifier to represent it.
void setFrameAddressIsTaken(bool T)
void setHasTailCall(bool V=true)
void setReturnAddressIsTaken(bool s)
const TargetSubtargetInfo & getSubtarget() const
getSubtarget - Return the subtarget for which this machine code is being compiled.
MachineMemOperand * getMachineMemOperand(MachinePointerInfo PtrInfo, MachineMemOperand::Flags f, LLT MemTy, Align base_alignment, const AAMDNodes &AAInfo=AAMDNodes(), const MDNode *Ranges=nullptr, SyncScope::ID SSID=SyncScope::System, AtomicOrdering Ordering=AtomicOrdering::NotAtomic, AtomicOrdering FailureOrdering=AtomicOrdering::NotAtomic)
getMachineMemOperand - Allocate a new MachineMemOperand.
MachineFrameInfo & getFrameInfo()
getFrameInfo - Return the frame info object for the current function.
MachineRegisterInfo & getRegInfo()
getRegInfo - Return information about the registers currently in use.
const DataLayout & getDataLayout() const
Return the DataLayout attached to the Module associated to this MF.
Function & getFunction()
Return the LLVM function that this machine code represents.
BasicBlockListType::iterator iterator
Ty * getInfo()
getInfo - Keep track of various per-function pieces of information for backends that would like to do...
Register addLiveIn(MCRegister PReg, const TargetRegisterClass *RC)
addLiveIn - Add the specified physical register as a live-in value and create a corresponding virtual...
MachineBasicBlock * CreateMachineBasicBlock(const BasicBlock *BB=nullptr, std::optional< UniqueBBID > BBID=std::nullopt)
CreateMachineBasicBlock - Allocate a new MachineBasicBlock.
void insert(iterator MBBI, MachineBasicBlock *MBB)
const MachineInstrBuilder & addImm(int64_t Val) const
Add a new immediate operand.
const MachineInstrBuilder & addReg(Register RegNo, unsigned flags=0, unsigned SubReg=0) const
Add a new virtual register operand.
const MachineInstrBuilder & addMBB(MachineBasicBlock *MBB, unsigned TargetFlags=0) const
Representation of each machine instruction.
LLVM_ABI void collectDebugValues(SmallVectorImpl< MachineInstr * > &DbgValues)
Scan instructions immediately following MI and collect any matching DBG_VALUEs.
LLVM_ABI void eraseFromParent()
Unlink 'this' from the containing basic block and delete it.
const MachineOperand & getOperand(unsigned i) const
A description of a memory reference used in the backend.
Flags
Flags values. These may be or'd together.
@ MOVolatile
The memory access is volatile.
@ MODereferenceable
The memory access is dereferenceable (i.e., doesn't trap).
@ MOLoad
The memory access reads data.
@ MOInvariant
The memory access always returns the same value (or traps).
@ MOStore
The memory access writes data.
MachineOperand class - Representation of each machine instruction operand.
void setIsKill(bool Val=true)
void setIsUndef(bool Val=true)
Register getReg() const
getReg - Returns the register number.
static MachineOperand CreateReg(Register Reg, bool isDef, bool isImp=false, bool isKill=false, bool isDead=false, bool isUndef=false, bool isEarlyClobber=false, unsigned SubReg=0, bool isDebug=false, bool isInternalRead=false, bool isRenamable=false)
MachineRegisterInfo - Keep track of information for virtual and physical registers,...
EVT getMemoryVT() const
Return the type of the in-memory value.
MutableArrayRef - Represent a mutable reference to an array (0 or more elements consecutively in memo...
Definition ArrayRef.h:299
Class to represent pointers.
unsigned getAddressSpace() const
Return the address space of the Pointer type.
Wrapper class representing virtual and physical registers.
Definition Register.h:20
constexpr bool isVirtual() const
Return true if the specified register number is in the virtual register namespace.
Definition Register.h:79
Wrapper class for IR location info (IR ordering and DebugLoc) to be passed into SDNode creation funct...
Represents one node in the SelectionDAG.
const APInt & getAsAPIntVal() const
Helper method returns the APInt value of a ConstantSDNode.
unsigned getOpcode() const
Return the SelectionDAG opcode value for this node.
LLVM_ABI bool isOnlyUserOf(const SDNode *N) const
Return true if this node is the only use of N.
size_t use_size() const
Return the number of uses of this node.
MVT getSimpleValueType(unsigned ResNo) const
Return the type of a specified result as a simple type.
uint64_t getAsZExtVal() const
Helper method returns the zero-extended integer value of a ConstantSDNode.
unsigned getNumOperands() const
Return the number of values used by this operation.
const SDValue & getOperand(unsigned Num) const
EVT getValueType(unsigned ResNo) const
Return the type of a specified result.
bool isUndef() const
Returns true if the node type is UNDEF or POISON.
Unlike LLVM values, Selection DAG nodes may return multiple values as the result of a computation.
bool isUndef() const
SDNode * getNode() const
get the SDNode which holds the desired result
bool hasOneUse() const
Return true if there is exactly one node using value ResNo of Node.
SDValue getValue(unsigned R) const
EVT getValueType() const
Return the ValueType of the referenced return value.
TypeSize getValueSizeInBits() const
Returns the size of the value in bits.
const SDValue & getOperand(unsigned i) const
uint64_t getScalarValueSizeInBits() const
uint64_t getConstantOperandVal(unsigned i) const
MVT getSimpleValueType() const
Return the simple ValueType of the referenced return value.
unsigned getOpcode() const
This is used to represent a portion of an LLVM function in a low-level Data Dependence DAG representa...
LLVM_ABI SDValue getExtLoad(ISD::LoadExtType ExtType, const SDLoc &dl, EVT VT, SDValue Chain, SDValue Ptr, MachinePointerInfo PtrInfo, EVT MemVT, MaybeAlign Alignment=MaybeAlign(), MachineMemOperand::Flags MMOFlags=MachineMemOperand::MONone, const AAMDNodes &AAInfo=AAMDNodes())
SDValue getTargetGlobalAddress(const GlobalValue *GV, const SDLoc &DL, EVT VT, int64_t offset=0, unsigned TargetFlags=0)
SDValue getCopyToReg(SDValue Chain, const SDLoc &dl, Register Reg, SDValue N)
LLVM_ABI SDValue getMergeValues(ArrayRef< SDValue > Ops, const SDLoc &dl)
Create a MERGE_VALUES node from the given operands.
LLVM_ABI SDVTList getVTList(EVT VT)
Return an SDVTList that represents the list of values specified.
LLVM_ABI SDValue getShiftAmountConstant(uint64_t Val, EVT VT, const SDLoc &DL)
LLVM_ABI SDValue getAllOnesConstant(const SDLoc &DL, EVT VT, bool IsTarget=false, bool IsOpaque=false)
LLVM_ABI MachineSDNode * getMachineNode(unsigned Opcode, const SDLoc &dl, EVT VT)
These are used for target selectors to create a new node with specified return type(s),...
LLVM_ABI SDValue getFreeze(SDValue V)
Return a freeze using the SDLoc of the value operand.
SDValue getSetCC(const SDLoc &DL, EVT VT, SDValue LHS, SDValue RHS, ISD::CondCode Cond, SDValue Chain=SDValue(), bool IsSignaling=false)
Helper function to make it easier to build SetCC's if you just have an ISD::CondCode instead of an SD...
bool isSafeToSpeculativelyExecute(unsigned Opcode) const
Some opcodes may create immediate undefined behavior when used with some values (integer division-by-...
SDValue getExtractSubvector(const SDLoc &DL, EVT VT, SDValue Vec, unsigned Idx)
Return the VT typed sub-vector of Vec at Idx.
LLVM_ABI SDValue getRegister(Register Reg, EVT VT)
LLVM_ABI SDValue getLoad(EVT VT, const SDLoc &dl, SDValue Chain, SDValue Ptr, MachinePointerInfo PtrInfo, MaybeAlign Alignment=MaybeAlign(), MachineMemOperand::Flags MMOFlags=MachineMemOperand::MONone, const AAMDNodes &AAInfo=AAMDNodes(), const MDNode *Ranges=nullptr)
Loads are not normal binary operators: their result type is not determined by their operands,...
SDValue getInsertSubvector(const SDLoc &DL, SDValue Vec, SDValue SubVec, unsigned Idx)
Insert SubVec at the Idx element of Vec.
LLVM_ABI SDValue getMemcpy(SDValue Chain, const SDLoc &dl, SDValue Dst, SDValue Src, SDValue Size, Align Alignment, bool isVol, bool AlwaysInline, const CallInst *CI, std::optional< bool > OverrideTailCall, MachinePointerInfo DstPtrInfo, MachinePointerInfo SrcPtrInfo, const AAMDNodes &AAInfo=AAMDNodes(), BatchAAResults *BatchAA=nullptr)
void addNoMergeSiteInfo(const SDNode *Node, bool NoMerge)
Set NoMergeSiteInfo to be associated with Node if NoMerge is true.
LLVM_ABI SDValue getNOT(const SDLoc &DL, SDValue Val, EVT VT)
Create a bitwise NOT operation as (XOR Val, -1).
const TargetLowering & getTargetLoweringInfo() const
static constexpr unsigned MaxRecursionDepth
SDValue getTargetJumpTable(int JTI, EVT VT, unsigned TargetFlags=0)
SDValue getUNDEF(EVT VT)
Return an UNDEF node. UNDEF does not have a useful SDLoc.
SDValue getCALLSEQ_END(SDValue Chain, SDValue Op1, SDValue Op2, SDValue InGlue, const SDLoc &DL)
Return a new CALLSEQ_END node, which always must have a glue result (to ensure it's not CSE'd).
SDValue getBuildVector(EVT VT, const SDLoc &DL, ArrayRef< SDValue > Ops)
Return an ISD::BUILD_VECTOR node.
LLVM_ABI bool isSplatValue(SDValue V, const APInt &DemandedElts, APInt &UndefElts, unsigned Depth=0) const
Test whether V has a splatted value for all the demanded elements.
LLVM_ABI SDValue getBitcast(EVT VT, SDValue V)
Return a bitcast using the SDLoc of the value operand, and casting to the provided type.
SDValue getCopyFromReg(SDValue Chain, const SDLoc &dl, Register Reg, EVT VT)
SDValue getSelect(const SDLoc &DL, EVT VT, SDValue Cond, SDValue LHS, SDValue RHS, SDNodeFlags Flags=SDNodeFlags())
Helper function to make it easier to build Select's if you just have operands and don't want to check...
LLVM_ABI SDValue getNegative(SDValue Val, const SDLoc &DL, EVT VT)
Create negative operation as (SUB 0, Val).
LLVM_ABI void setNodeMemRefs(MachineSDNode *N, ArrayRef< MachineMemOperand * > NewMemRefs)
Mutate the specified machine node's memory references to the provided list.
const DataLayout & getDataLayout() const
LLVM_ABI SDValue getConstant(uint64_t Val, const SDLoc &DL, EVT VT, bool isTarget=false, bool isOpaque=false)
Create a ConstantSDNode wrapping a constant value.
SDValue getSignedTargetConstant(int64_t Val, const SDLoc &DL, EVT VT, bool isOpaque=false)
LLVM_ABI void ReplaceAllUsesWith(SDValue From, SDValue To)
Modify anything using 'From' to use 'To' instead.
LLVM_ABI SDValue getCommutedVectorShuffle(const ShuffleVectorSDNode &SV)
Returns an ISD::VECTOR_SHUFFLE node semantically equivalent to the shuffle node in input but with swa...
LLVM_ABI std::pair< SDValue, SDValue > SplitVector(const SDValue &N, const SDLoc &DL, const EVT &LoVT, const EVT &HiVT)
Split the vector with EXTRACT_SUBVECTOR using the provided VTs and return the low/high part.
LLVM_ABI SDValue getStore(SDValue Chain, const SDLoc &dl, SDValue Val, SDValue Ptr, MachinePointerInfo PtrInfo, Align Alignment, MachineMemOperand::Flags MMOFlags=MachineMemOperand::MONone, const AAMDNodes &AAInfo=AAMDNodes())
Helper function to build ISD::STORE nodes.
LLVM_ABI SDValue getSignedConstant(int64_t Val, const SDLoc &DL, EVT VT, bool isTarget=false, bool isOpaque=false)
SDValue getCALLSEQ_START(SDValue Chain, uint64_t InSize, uint64_t OutSize, const SDLoc &DL)
Return a new CALLSEQ_START node, that starts new call frame, in which InSize bytes are set up inside ...
LLVM_ABI SDValue FoldConstantArithmetic(unsigned Opcode, const SDLoc &DL, EVT VT, ArrayRef< SDValue > Ops, SDNodeFlags Flags=SDNodeFlags())
LLVM_ABI SDValue getExternalSymbol(const char *Sym, EVT VT)
const TargetMachine & getTarget() const
LLVM_ABI SDValue WidenVector(const SDValue &N, const SDLoc &DL)
Widen the vector up to the next power of two using INSERT_SUBVECTOR.
LLVM_ABI SDValue getIntPtrConstant(uint64_t Val, const SDLoc &DL, bool isTarget=false)
LLVM_ABI SDValue getValueType(EVT)
LLVM_ABI SDValue getNode(unsigned Opcode, const SDLoc &DL, EVT VT, ArrayRef< SDUse > Ops)
Gets or creates the specified node.
SDValue getTargetConstant(uint64_t Val, const SDLoc &DL, EVT VT, bool isOpaque=false)
SDValue getTargetBlockAddress(const BlockAddress *BA, EVT VT, int64_t Offset=0, unsigned TargetFlags=0)
LLVM_ABI SDValue getVectorIdxConstant(uint64_t Val, const SDLoc &DL, bool isTarget=false)
LLVM_ABI void ReplaceAllUsesOfValueWith(SDValue From, SDValue To)
Replace any uses of From with To, leaving uses of other values produced by From.getNode() alone.
MachineFunction & getMachineFunction() const
SDValue getSplatBuildVector(EVT VT, const SDLoc &DL, SDValue Op)
Return a splat ISD::BUILD_VECTOR node, consisting of Op splatted to all elements.
LLVM_ABI SDValue getFrameIndex(int FI, EVT VT, bool isTarget=false)
LLVM_ABI KnownBits computeKnownBits(SDValue Op, unsigned Depth=0) const
Determine which bits of Op are known to be either zero or one and return them in Known.
LLVM_ABI SDValue getRegisterMask(const uint32_t *RegMask)
LLVM_ABI SDValue getZExtOrTrunc(SDValue Op, const SDLoc &DL, EVT VT)
Convert Op, which must be of integer type, to the integer type VT, by either zero-extending or trunca...
LLVM_ABI SDValue getCondCode(ISD::CondCode Cond)
LLVM_ABI bool MaskedValueIsZero(SDValue Op, const APInt &Mask, unsigned Depth=0) const
Return true if 'Op & Mask' is known to be zero.
LLVMContext * getContext() const
LLVM_ABI SDValue getTargetExternalSymbol(const char *Sym, EVT VT, unsigned TargetFlags=0)
LLVM_ABI SDValue CreateStackTemporary(TypeSize Bytes, Align Alignment)
Create a stack temporary based on the size in bytes and the alignment.
SDValue getTargetConstantPool(const Constant *C, EVT VT, MaybeAlign Align=std::nullopt, int Offset=0, unsigned TargetFlags=0)
SDValue getEntryNode() const
Return the token chain corresponding to the entry of the function.
LLVM_ABI std::pair< SDValue, SDValue > SplitScalar(const SDValue &N, const SDLoc &DL, const EVT &LoVT, const EVT &HiVT)
Split the scalar node with EXTRACT_ELEMENT using the provided VTs and return the low/high part.
LLVM_ABI SDValue getVectorShuffle(EVT VT, const SDLoc &dl, SDValue N1, SDValue N2, ArrayRef< int > Mask)
Return an ISD::VECTOR_SHUFFLE node.
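A hedged sketch of how the SelectionDAG node builders listed above compose inside a lowering hook; the helper name and the node shape are invented for illustration only.

#include "llvm/CodeGen/SelectionDAG.h"
using namespace llvm;

static SDValue buildMaskedAdd(SelectionDAG &DAG, const SDLoc &DL, SDValue A,
                              SDValue B, uint64_t MaskVal) {
  EVT VT = A.getValueType();
  SDValue Sum = DAG.getNode(ISD::ADD, DL, VT, A, B);
  SDValue Mask = DAG.getConstant(MaskVal, DL, VT); // ConstantSDNode wrapper
  return DAG.getNode(ISD::AND, DL, VT, Sum, Mask); // (A + B) & MaskVal
}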
static LLVM_ABI bool isReverseMask(ArrayRef< int > Mask, int NumSrcElts)
Return true if this shuffle mask swaps the order of elements from exactly one source vector.
ArrayRef< int > getMask() const
SmallSet - This maintains a set of unique values, optimizing for the case when the set is small (less...
Definition SmallSet.h:133
size_type count(const T &V) const
count - Return 1 if the element is in the set, 0 otherwise.
Definition SmallSet.h:175
std::pair< const_iterator, bool > insert(const T &V)
insert - Insert an element into the set if it isn't already there.
Definition SmallSet.h:183
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
void assign(size_type NumElts, ValueParamT Elt)
typename SuperClass::const_iterator const_iterator
void push_back(const T &Elt)
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
StackOffset holds a fixed and a scalable offset in bytes.
Definition TypeSize.h:31
StringRef - Represent a constant reference to a string, i.e.
Definition StringRef.h:55
std::pair< StringRef, StringRef > split(char Separator) const
Split into two substrings around the first occurrence of a separator character.
Definition StringRef.h:702
bool starts_with(StringRef Prefix) const
Check if this string starts with the given Prefix.
Definition StringRef.h:261
constexpr size_t size() const
size - Get the string size.
Definition StringRef.h:146
TargetInstrInfo - Interface to description of machine instruction set.
void setBooleanVectorContents(BooleanContent Ty)
Specify how the target extends the result of a vector boolean value from a vector of i1 to a wider ty...
void setOperationAction(unsigned Op, MVT VT, LegalizeAction Action)
Indicate that the specified operation does not work with the specified type and indicate what to do a...
MachineBasicBlock * emitPatchPoint(MachineInstr &MI, MachineBasicBlock *MBB) const
Replace/modify any TargetFrameIndex operands with a target-dependent sequence of memory operands that...
virtual const TargetRegisterClass * getRegClassFor(MVT VT, bool isDivergent=false) const
Return the register class that should be used for the specified value type.
const TargetMachine & getTargetMachine() const
virtual unsigned getNumRegistersForCallingConv(LLVMContext &Context, CallingConv::ID CC, EVT VT) const
Certain targets require unusual breakdowns of certain types.
virtual bool isZExtFree(Type *FromTy, Type *ToTy) const
Return true if any actual instruction that defines a value of type FromTy implicitly zero-extends the...
virtual MVT getRegisterTypeForCallingConv(LLVMContext &Context, CallingConv::ID CC, EVT VT) const
Certain combinations of ABIs, Targets and features require that types are legal for some operations a...
LegalizeTypeAction
This enum indicates whether types are legal for a target, and if not, what action should be used to...
void setMaxBytesForAlignment(unsigned MaxBytes)
void setPrefLoopAlignment(Align Alignment)
Set the target's preferred loop alignment.
void setMaxAtomicSizeInBitsSupported(unsigned SizeInBits)
Set the maximum atomic operation size supported by the backend.
virtual TargetLoweringBase::LegalizeTypeAction getPreferredVectorAction(MVT VT) const
Return the preferred vector type legalization action.
void setMinFunctionAlignment(Align Alignment)
Set the target's minimum function alignment.
void setBooleanContents(BooleanContent Ty)
Specify how the target extends the result of integer and floating point boolean values from i1 to a w...
void computeRegisterProperties(const TargetRegisterInfo *TRI)
Once all of the register classes are added, this allows us to compute derived properties we expose.
virtual EVT getTypeToTransformTo(LLVMContext &Context, EVT VT) const
For types supported by the target, this is an identity function.
void addRegisterClass(MVT VT, const TargetRegisterClass *RC)
Add the specified register class as an available regclass for the specified value type.
bool isTypeLegal(EVT VT) const
Return true if the target has native support for the specified value type.
virtual MVT getPointerTy(const DataLayout &DL, uint32_t AS=0) const
Return the pointer type for the given address space, defaults to the pointer type from the data layou...
void setPrefFunctionAlignment(Align Alignment)
Set the target's preferred function alignment.
void setTruncStoreAction(MVT ValVT, MVT MemVT, LegalizeAction Action)
Indicate that the specified truncating store does not work with the specified type and indicate what ...
bool isOperationLegalOrCustom(unsigned Op, EVT VT, bool LegalOnly=false) const
Return true if the specified operation is legal on this target or can be made legal with custom lower...
virtual bool isBinOp(unsigned Opcode) const
Return true if the node is a math/logic binary operator.
void setMinCmpXchgSizeInBits(unsigned SizeInBits)
Sets the minimum cmpxchg or ll/sc size supported by the backend.
void setStackPointerRegisterToSaveRestore(Register R)
If set to a physical register, this specifies the register that llvm.savestack/llvm....
AtomicExpansionKind
Enum that specifies what an atomic load/AtomicRMWInst is expanded to, if at all.
void setCondCodeAction(ArrayRef< ISD::CondCode > CCs, MVT VT, LegalizeAction Action)
Indicate that the specified condition code is or isn't supported on the target and indicate what to d...
void setTargetDAGCombine(ArrayRef< ISD::NodeType > NTs)
Targets should invoke this method for each target independent node that they want to provide a custom...
void setLoadExtAction(unsigned ExtType, MVT ValVT, MVT MemVT, LegalizeAction Action)
Indicate that the specified load with extension does not work with the specified type and indicate wh...
LegalizeTypeAction getTypeAction(LLVMContext &Context, EVT VT) const
Return how we should legalize values of this type, either it is already legal (return 'Legal') or we ...
std::vector< ArgListEntry > ArgListTy
bool isOperationLegalOrCustomOrPromote(unsigned Op, EVT VT, bool LegalOnly=false) const
Return true if the specified operation is legal on this target or can be made legal with custom lower...
This class defines information used to lower LLVM code to legal SelectionDAG operators that the targe...
bool SimplifyDemandedVectorElts(SDValue Op, const APInt &DemandedEltMask, APInt &KnownUndef, APInt &KnownZero, TargetLoweringOpt &TLO, unsigned Depth=0, bool AssumeSingleUse=false) const
Look at Vector Op.
std::pair< SDValue, SDValue > makeLibCall(SelectionDAG &DAG, RTLIB::Libcall LC, EVT RetVT, ArrayRef< SDValue > Ops, MakeLibCallOptions CallOptions, const SDLoc &dl, SDValue Chain=SDValue()) const
Returns a pair of (return value, chain).
virtual InlineAsm::ConstraintCode getInlineAsmMemConstraint(StringRef ConstraintCode) const
SDValue SimplifyMultipleUseDemandedBits(SDValue Op, const APInt &DemandedBits, const APInt &DemandedElts, SelectionDAG &DAG, unsigned Depth=0) const
More limited version of SimplifyDemandedBits that can be used to "look through" ops that don't contrib...
virtual ConstraintType getConstraintType(StringRef Constraint) const
Given a constraint, return the type of constraint it is for this target.
std::pair< SDValue, SDValue > LowerCallTo(CallLoweringInfo &CLI) const
This function lowers an abstract call to a function into an actual call.
virtual std::pair< unsigned, const TargetRegisterClass * > getRegForInlineAsmConstraint(const TargetRegisterInfo *TRI, StringRef Constraint, MVT VT) const
Given a physical register constraint (e.g.
bool SimplifyDemandedBits(SDValue Op, const APInt &DemandedBits, const APInt &DemandedElts, KnownBits &Known, TargetLoweringOpt &TLO, unsigned Depth=0, bool AssumeSingleUse=false) const
Look at Op.
virtual bool SimplifyDemandedBitsForTargetNode(SDValue Op, const APInt &DemandedBits, const APInt &DemandedElts, KnownBits &Known, TargetLoweringOpt &TLO, unsigned Depth=0) const
Attempt to simplify any target nodes based on the demanded bits/elts, returning true on success.
TargetLowering(const TargetLowering &)=delete
virtual void LowerAsmOperandForConstraint(SDValue Op, StringRef Constraint, std::vector< SDValue > &Ops, SelectionDAG &DAG) const
Lower the specified operand into the Ops vector.
Primary interface to the complete machine description for the target machine.
bool useTLSDESC() const
Returns true if this target uses TLS Descriptors.
bool useEmulatedTLS() const
Returns true if this target uses emulated TLS.
bool shouldAssumeDSOLocal(const GlobalValue *GV) const
CodeModel::Model getCodeModel() const
Returns the code model.
TargetRegisterInfo base class - We assume that the target defines a static array of TargetRegisterDes...
virtual const TargetInstrInfo * getInstrInfo() const
Twine - A lightweight data structure for efficiently representing the concatenation of temporary valu...
Definition Twine.h:82
The instances of the Type class are immutable: once they are created, they are never changed.
Definition Type.h:45
LLVM_ABI unsigned getIntegerBitWidth() const
LLVM_ABI TypeSize getPrimitiveSizeInBits() const LLVM_READONLY
Return the basic size of this type if it is a primitive type.
Definition Type.cpp:198
bool isIntegerTy() const
True if this is an instance of IntegerType.
Definition Type.h:240
static LLVM_ABI IntegerType * getIntNTy(LLVMContext &C, unsigned N)
Definition Type.cpp:301
This class is used to represent EVT's, which are used to parameterize some operations.
LLVM Value Representation.
Definition Value.h:75
Type * getType() const
All values are typed, get the type of this value.
Definition Value.h:256
LLVM_ABI void replaceAllUsesWith(Value *V)
Change all uses of this to point to a new Value.
Definition Value.cpp:546
self_iterator getIterator()
Definition ilist_node.h:123
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
constexpr char Align[]
Key for Kernel::Arg::Metadata::mAlign.
constexpr char Args[]
Key for Kernel::Metadata::mArgs.
constexpr std::underlying_type_t< E > Mask()
Get a bitmask with 1s in all places up to the high-order bit of E's largest value.
unsigned ID
LLVM IR allows arbitrary numbers to be used as calling convention identifiers.
Definition CallingConv.h:24
@ PreserveMost
Used for runtime calls that preserves most registers.
Definition CallingConv.h:63
@ GHC
Used by the Glasgow Haskell Compiler (GHC).
Definition CallingConv.h:50
@ Fast
Attempts to make calls as fast as possible (e.g.
Definition CallingConv.h:41
@ C
The default llvm calling convention, compatible with C.
Definition CallingConv.h:34
NodeType
ISD::NodeType enum - This enum defines the target-independent operators for a SelectionDAG.
Definition ISDOpcodes.h:41
@ SETCC
SetCC operator - This evaluates to a true value iff the condition is true.
Definition ISDOpcodes.h:807
@ STRICT_FSETCC
STRICT_FSETCC/STRICT_FSETCCS - Constrained versions of SETCC, used for floating-point operands only.
Definition ISDOpcodes.h:504
@ DELETED_NODE
DELETED_NODE - This is an illegal value that is used to catch errors.
Definition ISDOpcodes.h:45
@ SMUL_LOHI
SMUL_LOHI/UMUL_LOHI - Multiply two integers of type iN, producing a signed/unsigned value of type i[2...
Definition ISDOpcodes.h:270
@ INSERT_SUBVECTOR
INSERT_SUBVECTOR(VECTOR1, VECTOR2, IDX) - Returns a vector with VECTOR2 inserted into VECTOR1.
Definition ISDOpcodes.h:593
@ BSWAP
Byte Swap and Counting operators.
Definition ISDOpcodes.h:771
@ ADD
Simple integer binary arithmetic operators.
Definition ISDOpcodes.h:259
@ ANY_EXTEND
ANY_EXTEND - Used for integer types. The high bits are undefined.
Definition ISDOpcodes.h:841
@ FMA
FMA - Perform a * b + c with no intermediate rounding step.
Definition ISDOpcodes.h:511
@ INTRINSIC_VOID
OUTCHAIN = INTRINSIC_VOID(INCHAIN, INTRINSICID, arg1, arg2, ...) This node represents a target intrin...
Definition ISDOpcodes.h:215
@ GlobalAddress
Definition ISDOpcodes.h:88
@ SINT_TO_FP
[SU]INT_TO_FP - These operators convert integers (whose interpreted sign depends on the first letter)...
Definition ISDOpcodes.h:868
@ CONCAT_VECTORS
CONCAT_VECTORS(VECTOR0, VECTOR1, ...) - Given a number of values of vector type with the same length ...
Definition ISDOpcodes.h:577
@ FADD
Simple binary floating point operators.
Definition ISDOpcodes.h:410
@ ABS
ABS - Determine the unsigned absolute value of a signed integer value of the same bitwidth.
Definition ISDOpcodes.h:744
@ BUILD_PAIR
BUILD_PAIR - This is the opposite of EXTRACT_ELEMENT in some ways.
Definition ISDOpcodes.h:249
@ BUILTIN_OP_END
BUILTIN_OP_END - This must be the last enum value in this list.
@ GlobalTLSAddress
Definition ISDOpcodes.h:89
@ SIGN_EXTEND
Conversion operators.
Definition ISDOpcodes.h:832
@ SCALAR_TO_VECTOR
SCALAR_TO_VECTOR(VAL) - This represents the operation of loading a scalar value into element 0 of the...
Definition ISDOpcodes.h:662
@ FCANONICALIZE
Returns platform specific canonical encoding of a floating point number.
Definition ISDOpcodes.h:534
@ IS_FPCLASS
Performs a check of floating point class property, defined by IEEE-754.
Definition ISDOpcodes.h:541
@ SSUBSAT
RESULT = [US]SUBSAT(LHS, RHS) - Perform saturation subtraction on 2 integers with the same bit width ...
Definition ISDOpcodes.h:369
@ SELECT
Select(COND, TRUEVAL, FALSEVAL).
Definition ISDOpcodes.h:784
@ UNDEF
UNDEF - An undefined node.
Definition ISDOpcodes.h:228
@ MULHU
MULHU/MULHS - Multiply high - Multiply two integers of type iN, producing an unsigned/signed value of...
Definition ISDOpcodes.h:701
@ SHL
Shift and rotation operations.
Definition ISDOpcodes.h:762
@ VECTOR_SHUFFLE
VECTOR_SHUFFLE(VEC1, VEC2) - Returns a vector, of the same type as VEC1/VEC2.
Definition ISDOpcodes.h:642
@ EXTRACT_SUBVECTOR
EXTRACT_SUBVECTOR(VECTOR, IDX) - Returns a subvector from VECTOR.
Definition ISDOpcodes.h:607
@ READ_REGISTER
READ_REGISTER, WRITE_REGISTER - This node represents llvm.register on the DAG, which implements the n...
Definition ISDOpcodes.h:134
@ EXTRACT_VECTOR_ELT
EXTRACT_VECTOR_ELT(VECTOR, IDX) - Returns a single element from VECTOR identified by the (potentially...
Definition ISDOpcodes.h:569
@ CopyToReg
CopyToReg - This node has three operands: a chain, a register number to set to this value,...
Definition ISDOpcodes.h:219
@ ZERO_EXTEND
ZERO_EXTEND - Used for integer types, zeroing the new bits.
Definition ISDOpcodes.h:838
@ SELECT_CC
Select with condition operator - This selects between a true value and a false value (ops #2 and #3) ...
Definition ISDOpcodes.h:799
@ SIGN_EXTEND_INREG
SIGN_EXTEND_INREG - This operator atomically performs a SHL/SRA pair to sign extend a small value in ...
Definition ISDOpcodes.h:876
@ SMIN
[US]{MIN/MAX} - Binary minimum or maximum of signed or unsigned integers.
Definition ISDOpcodes.h:724
@ VSELECT
Select with a vector condition (op #0) and two vector operands (ops #1 and #2), returning a vector re...
Definition ISDOpcodes.h:793
@ EH_DWARF_CFA
EH_DWARF_CFA - This node represents the pointer to the DWARF Canonical Frame Address (CFA),...
Definition ISDOpcodes.h:145
@ FRAMEADDR
FRAMEADDR, RETURNADDR - These nodes represent llvm.frameaddress and llvm.returnaddress on the DAG.
Definition ISDOpcodes.h:110
@ FP_TO_SINT
FP_TO_[US]INT - Convert a floating point value to a signed or unsigned integer.
Definition ISDOpcodes.h:914
@ AND
Bitwise operators - logical and, logical or, logical xor.
Definition ISDOpcodes.h:736
@ INTRINSIC_WO_CHAIN
RESULT = INTRINSIC_WO_CHAIN(INTRINSICID, arg1, arg2, ...) This node represents a target intrinsic fun...
Definition ISDOpcodes.h:200
@ FREEZE
FREEZE - FREEZE(VAL) returns an arbitrary value if VAL is UNDEF (or is evaluated to UNDEF),...
Definition ISDOpcodes.h:236
@ INSERT_VECTOR_ELT
INSERT_VECTOR_ELT(VECTOR, VAL, IDX) - Returns VECTOR with the element at IDX replaced with VAL.
Definition ISDOpcodes.h:558
@ TokenFactor
TokenFactor - This node takes multiple tokens as input and produces a single token result.
Definition ISDOpcodes.h:53
@ TRUNCATE
TRUNCATE - Completely drop the high bits.
Definition ISDOpcodes.h:844
@ SHL_PARTS
SHL_PARTS/SRA_PARTS/SRL_PARTS - These operators are used for expanded integer shift operations.
Definition ISDOpcodes.h:821
@ AssertSext
AssertSext, AssertZext - These nodes record if a register contains a value that has already been zero...
Definition ISDOpcodes.h:62
@ SADDSAT
RESULT = [US]ADDSAT(LHS, RHS) - Perform saturation addition on 2 integers with the same bit width (W)...
Definition ISDOpcodes.h:360
@ ABDS
ABDS/ABDU - Absolute difference - Return the absolute difference between two numbers interpreted as s...
Definition ISDOpcodes.h:719
@ INTRINSIC_W_CHAIN
RESULT,OUTCHAIN = INTRINSIC_W_CHAIN(INCHAIN, INTRINSICID, arg1, ...) This node represents a target in...
Definition ISDOpcodes.h:208
@ BUILD_VECTOR
BUILD_VECTOR(ELT0, ELT1, ELT2, ELT3,...) - Return a fixed-width vector with the specified,...
Definition ISDOpcodes.h:549
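The ISD opcodes listed above are what SelectionDAG::getNode consumes when building or rewriting the DAG; a minimal, hypothetical use (DAG, DL, VT, LHS and RHS are assumptions):
  SDValue Sum = DAG.getNode(ISD::ADD, DL, VT, LHS, RHS);
  SDValue Wide = DAG.getNode(ISD::SIGN_EXTEND, DL, MVT::i64, Sum);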
LLVM_ABI CondCode getSetCCInverse(CondCode Operation, EVT Type)
Return the operation corresponding to !(X op Y), where 'op' is a valid SetCC operation.
LLVM_ABI bool isFreezeUndef(const SDNode *N)
Return true if the specified node is FREEZE(UNDEF).
LLVM_ABI CondCode getSetCCSwappedOperands(CondCode Operation)
Return the operation corresponding to (Y op X) when given the operation for (X op Y).
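A small illustration of the two condition-code helpers above; the starting condition is arbitrary:
  ISD::CondCode CC = ISD::SETLT;
  ISD::CondCode Inv = ISD::getSetCCInverse(CC, MVT::i64);     // !(x < y)  ->  SETGE
  ISD::CondCode Swap = ISD::getSetCCSwappedOperands(CC);      // (y op x)  ->  SETGT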
LLVM_ABI bool isBuildVectorAllZeros(const SDNode *N)
Return true if the specified node is a BUILD_VECTOR where all of the elements are 0 or undef.
CondCode
ISD::CondCode enum - These are ordered carefully to make the bitfields below work out,...
LLVM_ABI bool isBuildVectorAllOnes(const SDNode *N)
Return true if the specified node is a BUILD_VECTOR where all of the elements are ~0 or undef.
LLVM_ABI NodeType getVecReduceBaseOpcode(unsigned VecReduceOpcode)
Get underlying scalar opcode for VECREDUCE opcode.
LoadExtType
LoadExtType enum - This enum defines the three variants of LOADEXT (load with extension).
bool isIntEqualitySetCC(CondCode Code)
Return true if this is a setcc instruction that performs an equality comparison when used with intege...
This namespace contains an enum with a value for every intrinsic/builtin function known by LLVM.
LLVM_ABI Function * getOrInsertDeclaration(Module *M, ID id, ArrayRef< Type * > Tys={})
Look up the Function declaration of the intrinsic id in the Module M.
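A hedged IR-level sketch; the module M, the IRBuilder and the argument value are assumptions, and llvm.fabs is simply a convenient overloaded intrinsic to demonstrate the Tys parameter:
  Function *Fabs =
      Intrinsic::getOrInsertDeclaration(M, Intrinsic::fabs, {Builder.getDoubleTy()});
  Value *Abs = Builder.CreateCall(Fabs, {Arg});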
ABI getTargetABI(StringRef ABIName)
InstSeq generateInstSeq(int64_t Val)
LLVM_ABI Libcall getSINTTOFP(EVT OpVT, EVT RetVT)
getSINTTOFP - Return the SINTTOFP_*_* value for the given types, or UNKNOWN_LIBCALL if there is none.
LLVM_ABI Libcall getUINTTOFP(EVT OpVT, EVT RetVT)
getUINTTOFP - Return the UINTTOFP_*_* value for the given types, or UNKNOWN_LIBCALL if there is none.
LLVM_ABI Libcall getFPTOSINT(EVT OpVT, EVT RetVT)
getFPTOSINT - Return the FPTOSINT_*_* value for the given types, or UNKNOWN_LIBCALL if there is none.
LLVM_ABI Libcall getFPROUND(EVT OpVT, EVT RetVT)
getFPROUND - Return the FPROUND_*_* value for the given types, or UNKNOWN_LIBCALL if there is none.
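These lookups return RTLIB::UNKNOWN_LIBCALL when no runtime routine exists for the requested type pair, so callers typically guard on that; a small sketch:
  RTLIB::Libcall LC = RTLIB::getSINTTOFP(MVT::i128, MVT::f64);
  if (LC != RTLIB::UNKNOWN_LIBCALL) {
    // lower through makeLibCall, as sketched earlier
  }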
@ Kill
The last use of a register.
@ SingleThread
Synchronized with respect to signal handlers executing in the same thread.
Definition LLVMContext.h:55
ValuesClass values(OptsTy... Options)
Helper to build a ValuesClass by forwarding a variable number of arguments as an initializer list to ...
initializer< Ty > init(const Ty &Val)
Sequence
A sequence of states that a pointer may go through in which an objc_retain and objc_release are actua...
Definition PtrState.h:41
NodeAddr< NodeBase * > Node
Definition RDFGraph.h:381
This is an optimization pass for GlobalISel generic memory operations.
@ Low
Lower the current thread's priority such that it does not affect foreground tasks significantly.
Definition Threading.h:280
@ Offset
Definition DWP.cpp:477
bool all_of(R &&range, UnaryPredicate P)
Provide wrappers to std::all_of which take ranges instead of having to pass begin/end explicitly.
Definition STLExtras.h:1725
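A typical range-based use, assuming Mask is a container of shuffle-mask indices:
  bool InLowHalf = llvm::all_of(Mask, [](int M) { return M < 8; }); // undef entries (-1) also pass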
MachineInstrBuilder BuildMI(MachineFunction &MF, const MIMetadata &MIMD, const MCInstrDesc &MCID)
Builder interface. Specify how to create the initial instruction itself.
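A hedged sketch of the builder pattern as used in custom-inserter style code; BB, MI, DL, TII, the registers and the immediate are assumptions, and the opcode is only illustrative:
  BuildMI(*BB, MI, DL, TII->get(LoongArch::ORI), DstReg)
      .addReg(SrcReg)
      .addImm(Imm);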
constexpr bool isInt(int64_t x)
Checks if an integer fits into the given bit width.
Definition MathExtras.h:165
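For example, checking whether a value fits a signed 12-bit immediate field (Imm is an assumed int64_t):
  bool FitsSimm12 = isInt<12>(Imm); // true for -2048..2047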
LLVM_ABI bool isNullConstant(SDValue V)
Returns true if V is a constant integer zero.
LLVM_ABI SDValue peekThroughBitcasts(SDValue V)
Return the non-bitcasted source operand of V if it exists.
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:643
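A typical use while pattern-matching a DAG operand (Op is an assumption):
  if (auto *C = dyn_cast<ConstantSDNode>(Op.getOperand(1))) {
    uint64_t Imm = C->getZExtValue(); // operand 1 is a constant; use its value
  }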
bool isIntOrFPConstant(SDValue V)
Return true if V is either an integer or an FP constant.
int bit_width(T Value)
Returns the number of bits needed to represent Value if Value is nonzero.
Definition bit.h:303
constexpr bool isPowerOf2_64(uint64_t Value)
Return true if the argument is a power of two > 0 (64 bit edition.)
Definition MathExtras.h:284
LLVM_ABI bool widenShuffleMaskElts(int Scale, ArrayRef< int > Mask, SmallVectorImpl< int > &ScaledMask)
Try to transform a shuffle mask by replacing elements with the scaled index for an equivalent mask of...
unsigned Log2_64(uint64_t Value)
Return the floor log base 2 of the specified value, -1 if the value is zero.
Definition MathExtras.h:337
constexpr bool isShiftedMask_64(uint64_t Value)
Return true if the argument contains a non-empty sequence of ones with the remainder zero (64 bit ver...
Definition MathExtras.h:273
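Small illustrations of the bit-pattern helpers above, with arbitrarily chosen values:
  bool Pow2 = isPowerOf2_64(64);         // true
  unsigned L = Log2_64(64);              // 6
  bool SMask = isShiftedMask_64(0x0ff0); // true: a contiguous run of ones surrounded by zeros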
bool any_of(R &&range, UnaryPredicate P)
Provide wrappers to std::any_of which take ranges instead of having to pass begin/end explicitly.
Definition STLExtras.h:1732
MachineInstr * getImm(const MachineOperand &MO, const MachineRegisterInfo *MRI)
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
Definition Debug.cpp:207
LLVM_ABI void report_fatal_error(Error Err, bool gen_crash_diag=true)
Definition Error.cpp:167
constexpr bool isMask_64(uint64_t Value)
Return true if the argument is a non-empty sequence of ones starting at the least significant bit wit...
Definition MathExtras.h:261
constexpr bool isUInt(uint64_t x)
Checks if an unsigned integer fits into the given bit width.
Definition MathExtras.h:189
class LLVM_GSL_OWNER SmallVector
Forward declaration of SmallVector so that calculateSmallVectorDefaultInlinedElements can reference s...
bool isa(const From &Val)
isa<X> - Return true if the parameter to the template is an instance of one of the template type argu...
Definition Casting.h:547
AtomicOrdering
Atomic ordering for LLVM's memory model.
@ Other
Any other memory.
Definition ModRef.h:68
unsigned getKillRegState(bool B)
uint16_t MCPhysReg
An unsigned integer type large enough to represent all physical registers, but not necessarily virtua...
Definition MCRegister.h:21
DWARFExpression::Operation Op
ArrayRef(const T &OneElt) -> ArrayRef< T >
constexpr bool isShiftedInt(int64_t x)
Checks if a signed integer is an N bit number shifted left by S.
Definition MathExtras.h:182
constexpr unsigned BitWidth
std::string join_items(Sep Separator, Args &&... Items)
Joins the strings in the parameter pack Items, adding Separator between the elements....
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:559
LLVM_ABI bool isOneConstant(SDValue V)
Returns true if V is a constant integer one.
PointerUnion< const Value *, const PseudoSourceValue * > ValueType
LLVM_ABI bool isAllOnesConstant(SDValue V)
Returns true if V is an integer constant with all bits set.
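These SDValue predicates are convenient while matching select/setcc-style patterns; a small sketch (N is an assumed SDNode*):
  if (isOneConstant(N->getOperand(1)) && isAllOnesConstant(N->getOperand(2))) {
    // the true/false operands are the constants 1 and -1
  }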
LLVM_ABI void reportFatalUsageError(Error Err)
Report a fatal error that does not indicate a bug in LLVM.
Definition Error.cpp:180
void swap(llvm::BitVector &LHS, llvm::BitVector &RHS)
Implement std::swap in terms of BitVector swap.
Definition BitVector.h:869
#define N
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition Alignment.h:39
Extended Value Type.
Definition ValueTypes.h:35
EVT changeVectorElementTypeToInteger() const
Return a vector with the same number of elements as this vector, but with the element type converted ...
Definition ValueTypes.h:94
TypeSize getStoreSize() const
Return the number of bytes overwritten by a store of the specified value type.
Definition ValueTypes.h:395
bool isSimple() const
Test if the given EVT is simple (as opposed to being extended).
Definition ValueTypes.h:137
bool isFloatingPoint() const
Return true if this is a FP or a vector FP type.
Definition ValueTypes.h:147
TypeSize getSizeInBits() const
Return the size of the specified value type in bits.
Definition ValueTypes.h:373
uint64_t getScalarSizeInBits() const
Definition ValueTypes.h:385
MVT getSimpleVT() const
Return the SimpleValueType held in the specified simple EVT.
Definition ValueTypes.h:316
bool is128BitVector() const
Return true if this is a 128-bit vector type.
Definition ValueTypes.h:207
static EVT getIntegerVT(LLVMContext &Context, unsigned BitWidth)
Returns the EVT that represents an integer with the given number of bits.
Definition ValueTypes.h:65
uint64_t getFixedSizeInBits() const
Return the size of the specified fixed width value type in bits.
Definition ValueTypes.h:381
static EVT getFloatingPointVT(unsigned BitWidth)
Returns the EVT that represents a floating-point type with the given number of bits.
Definition ValueTypes.h:59
bool isVector() const
Return true if this is a vector value type.
Definition ValueTypes.h:168
EVT getScalarType() const
If this is a vector type, return the element type, otherwise return this.
Definition ValueTypes.h:323
bool is256BitVector() const
Return true if this is a 256-bit vector type.
Definition ValueTypes.h:212
LLVM_ABI Type * getTypeForEVT(LLVMContext &Context) const
This method returns an LLVM type corresponding to the specified EVT.
EVT getVectorElementType() const
Given a vector type, return the type of each element.
Definition ValueTypes.h:328
bool isScalarInteger() const
Return true if this is an integer, but not a vector.
Definition ValueTypes.h:157
unsigned getVectorNumElements() const
Given a vector type, return the number of elements it contains.
Definition ValueTypes.h:336
EVT getHalfNumVectorElementsVT(LLVMContext &Context) const
Definition ValueTypes.h:453
bool isInteger() const
Return true if this is an integer or a vector integer type.
Definition ValueTypes.h:152
Align getNonZeroOrigAlign() const
InputArg - This struct carries flags and type information about a single incoming (formal) argument o...
This class contains a discriminated union of information about pointers in memory operands,...
static LLVM_ABI MachinePointerInfo getStack(MachineFunction &MF, int64_t Offset, uint8_t ID=0)
Stack pointer relative access.
static LLVM_ABI MachinePointerInfo getGOT(MachineFunction &MF)
Return a MachinePointerInfo record that refers to a GOT entry.
static LLVM_ABI MachinePointerInfo getFixedStack(MachineFunction &MF, int FI, int64_t Offset=0)
Return a MachinePointerInfo record that refers to the specified FrameIndex.
This represents a list of ValueType's that has been intern'd by a SelectionDAG.
This represents an addressing mode of: BaseGV + BaseOffs + BaseReg + Scale*ScaleReg + ScalableOffset*...
This structure contains all information that is necessary for lowering calls.
SmallVector< ISD::InputArg, 32 > Ins
SmallVector< ISD::OutputArg, 32 > Outs
LLVM_ABI SDValue CombineTo(SDNode *N, ArrayRef< SDValue > To, bool AddTo=true)
This structure is used to pass arguments to makeLibCall function.
MakeLibCallOptions & setTypeListBeforeSoften(ArrayRef< EVT > OpsVT, EVT RetVT)
A convenience struct that encapsulates a DAG, and two SDValues for returning information from TargetL...