LLVM 22.0.0git
LegalizeDAG.cpp
Go to the documentation of this file.
1//===- LegalizeDAG.cpp - Implement SelectionDAG::Legalize -----------------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This file implements the SelectionDAG::Legalize method.
10//
11//===----------------------------------------------------------------------===//
12
13#include "llvm/ADT/APFloat.h"
14#include "llvm/ADT/APInt.h"
15#include "llvm/ADT/ArrayRef.h"
17#include "llvm/ADT/SetVector.h"
19#include "llvm/ADT/SmallSet.h"
36#include "llvm/IR/CallingConv.h"
37#include "llvm/IR/Constants.h"
38#include "llvm/IR/DataLayout.h"
40#include "llvm/IR/Function.h"
41#include "llvm/IR/Metadata.h"
42#include "llvm/IR/Type.h"
45#include "llvm/Support/Debug.h"
51#include <cassert>
52#include <cstdint>
53#include <tuple>
54#include <utility>
55
56using namespace llvm;
57
58#define DEBUG_TYPE "legalizedag"
59
60namespace {
61
62/// Keeps track of state when getting the sign of a floating-point value as an
63/// integer.
64struct FloatSignAsInt {
65 EVT FloatVT;
66 SDValue Chain;
67 SDValue FloatPtr;
68 SDValue IntPtr;
69 MachinePointerInfo IntPointerInfo;
70 MachinePointerInfo FloatPointerInfo;
71 SDValue IntValue;
72 APInt SignMask;
73 uint8_t SignBit;
74};
75
76//===----------------------------------------------------------------------===//
77/// This takes an arbitrary SelectionDAG as input and
78/// hacks on it until the target machine can handle it. This involves
79/// eliminating value sizes the machine cannot handle (promoting small sizes to
80/// large sizes or splitting up large values into small values) as well as
81/// eliminating operations the machine cannot handle.
82///
83/// This code also does a small amount of optimization and recognition of idioms
84/// as part of its processing. For example, if a target does not support a
85/// 'setcc' instruction efficiently, but does support 'brcc' instruction, this
86/// will attempt merge setcc and brc instructions into brcc's.
87class SelectionDAGLegalize {
88 const TargetMachine &TM;
89 const TargetLowering &TLI;
90 SelectionDAG &DAG;
91
92 /// The set of nodes which have already been legalized. We hold a
93 /// reference to it in order to update as necessary on node deletion.
94 SmallPtrSetImpl<SDNode *> &LegalizedNodes;
95
96 /// A set of all the nodes updated during legalization.
97 SmallSetVector<SDNode *, 16> *UpdatedNodes;
98
99 EVT getSetCCResultType(EVT VT) const {
100 return TLI.getSetCCResultType(DAG.getDataLayout(), *DAG.getContext(), VT);
101 }
102
103 // Libcall insertion helpers.
104
105public:
106 SelectionDAGLegalize(SelectionDAG &DAG,
107 SmallPtrSetImpl<SDNode *> &LegalizedNodes,
108 SmallSetVector<SDNode *, 16> *UpdatedNodes = nullptr)
109 : TM(DAG.getTarget()), TLI(DAG.getTargetLoweringInfo()), DAG(DAG),
110 LegalizedNodes(LegalizedNodes), UpdatedNodes(UpdatedNodes) {}
111
112 /// Legalizes the given operation.
113 void LegalizeOp(SDNode *Node);
114
115private:
116 SDValue OptimizeFloatStore(StoreSDNode *ST);
117
118 void LegalizeLoadOps(SDNode *Node);
119 void LegalizeStoreOps(SDNode *Node);
120
121 SDValue ExpandINSERT_VECTOR_ELT(SDValue Op);
122
123 /// Return a vector shuffle operation which
124 /// performs the same shuffe in terms of order or result bytes, but on a type
125 /// whose vector element type is narrower than the original shuffle type.
126 /// e.g. <v4i32> <0, 1, 0, 1> -> v8i16 <0, 1, 2, 3, 0, 1, 2, 3>
127 SDValue ShuffleWithNarrowerEltType(EVT NVT, EVT VT, const SDLoc &dl,
128 SDValue N1, SDValue N2,
129 ArrayRef<int> Mask) const;
130
131 std::pair<SDValue, SDValue> ExpandLibCall(RTLIB::Libcall LC, SDNode *Node,
133 bool IsSigned, EVT RetVT);
134 std::pair<SDValue, SDValue> ExpandLibCall(RTLIB::Libcall LC, SDNode *Node, bool isSigned);
135
136 void ExpandFPLibCall(SDNode *Node, RTLIB::Libcall LC,
138 void ExpandFPLibCall(SDNode *Node, RTLIB::Libcall Call_F32,
139 RTLIB::Libcall Call_F64, RTLIB::Libcall Call_F80,
140 RTLIB::Libcall Call_F128,
141 RTLIB::Libcall Call_PPCF128,
143
144 void
145 ExpandFastFPLibCall(SDNode *Node, bool IsFast,
146 std::pair<RTLIB::Libcall, RTLIB::Libcall> Call_F32,
147 std::pair<RTLIB::Libcall, RTLIB::Libcall> Call_F64,
148 std::pair<RTLIB::Libcall, RTLIB::Libcall> Call_F80,
149 std::pair<RTLIB::Libcall, RTLIB::Libcall> Call_F128,
150 std::pair<RTLIB::Libcall, RTLIB::Libcall> Call_PPCF128,
152
153 SDValue ExpandIntLibCall(SDNode *Node, bool isSigned, RTLIB::Libcall Call_I8,
154 RTLIB::Libcall Call_I16, RTLIB::Libcall Call_I32,
155 RTLIB::Libcall Call_I64, RTLIB::Libcall Call_I128);
156 void ExpandArgFPLibCall(SDNode *Node,
157 RTLIB::Libcall Call_F32, RTLIB::Libcall Call_F64,
158 RTLIB::Libcall Call_F80, RTLIB::Libcall Call_F128,
159 RTLIB::Libcall Call_PPCF128,
161 SDValue ExpandBitCountingLibCall(SDNode *Node, RTLIB::Libcall CallI32,
162 RTLIB::Libcall CallI64,
163 RTLIB::Libcall CallI128);
164 void ExpandDivRemLibCall(SDNode *Node, SmallVectorImpl<SDValue> &Results);
165
166 SDValue ExpandSincosStretLibCall(SDNode *Node) const;
167
168 SDValue EmitStackConvert(SDValue SrcOp, EVT SlotVT, EVT DestVT,
169 const SDLoc &dl);
170 SDValue EmitStackConvert(SDValue SrcOp, EVT SlotVT, EVT DestVT,
171 const SDLoc &dl, SDValue ChainIn);
172 SDValue ExpandBUILD_VECTOR(SDNode *Node);
173 SDValue ExpandSPLAT_VECTOR(SDNode *Node);
174 SDValue ExpandSCALAR_TO_VECTOR(SDNode *Node);
175 void ExpandDYNAMIC_STACKALLOC(SDNode *Node,
177 void getSignAsIntValue(FloatSignAsInt &State, const SDLoc &DL,
178 SDValue Value) const;
179 SDValue modifySignAsInt(const FloatSignAsInt &State, const SDLoc &DL,
180 SDValue NewIntValue) const;
181 SDValue ExpandFCOPYSIGN(SDNode *Node) const;
182 SDValue ExpandFABS(SDNode *Node) const;
183 SDValue ExpandFNEG(SDNode *Node) const;
184 SDValue expandLdexp(SDNode *Node) const;
185 SDValue expandFrexp(SDNode *Node) const;
186
187 SDValue ExpandLegalINT_TO_FP(SDNode *Node, SDValue &Chain);
188 void PromoteLegalINT_TO_FP(SDNode *N, const SDLoc &dl,
190 void PromoteLegalFP_TO_INT(SDNode *N, const SDLoc &dl,
192 SDValue PromoteLegalFP_TO_INT_SAT(SDNode *Node, const SDLoc &dl);
193
194 /// Implements vector reduce operation promotion.
195 ///
196 /// All vector operands are promoted to a vector type with larger element
197 /// type, and the start value is promoted to a larger scalar type. Then the
198 /// result is truncated back to the original scalar type.
199 SDValue PromoteReduction(SDNode *Node);
200
201 SDValue ExpandPARITY(SDValue Op, const SDLoc &dl);
202
203 SDValue ExpandExtractFromVectorThroughStack(SDValue Op);
204 SDValue ExpandInsertToVectorThroughStack(SDValue Op);
205 SDValue ExpandVectorBuildThroughStack(SDNode* Node);
206 SDValue ExpandConcatVectors(SDNode *Node);
207
208 SDValue ExpandConstantFP(ConstantFPSDNode *CFP, bool UseCP);
209 SDValue ExpandConstant(ConstantSDNode *CP);
210
211 // if ExpandNode returns false, LegalizeOp falls back to ConvertNodeToLibcall
212 bool ExpandNode(SDNode *Node);
213 void ConvertNodeToLibcall(SDNode *Node);
214 void PromoteNode(SDNode *Node);
215
216public:
217 // Node replacement helpers
218
219 void ReplacedNode(SDNode *N) {
220 LegalizedNodes.erase(N);
221 if (UpdatedNodes)
222 UpdatedNodes->insert(N);
223 }
224
225 void ReplaceNode(SDNode *Old, SDNode *New) {
226 LLVM_DEBUG(dbgs() << " ... replacing: "; Old->dump(&DAG);
227 dbgs() << " with: "; New->dump(&DAG));
228
229 assert(Old->getNumValues() == New->getNumValues() &&
230 "Replacing one node with another that produces a different number "
231 "of values!");
232 DAG.ReplaceAllUsesWith(Old, New);
233 if (UpdatedNodes)
234 UpdatedNodes->insert(New);
235 ReplacedNode(Old);
236 }
237
238 void ReplaceNode(SDValue Old, SDValue New) {
239 LLVM_DEBUG(dbgs() << " ... replacing: "; Old->dump(&DAG);
240 dbgs() << " with: "; New->dump(&DAG));
241
242 DAG.ReplaceAllUsesWith(Old, New);
243 if (UpdatedNodes)
244 UpdatedNodes->insert(New.getNode());
245 ReplacedNode(Old.getNode());
246 }
247
248 void ReplaceNode(SDNode *Old, const SDValue *New) {
249 LLVM_DEBUG(dbgs() << " ... replacing: "; Old->dump(&DAG));
250
251 DAG.ReplaceAllUsesWith(Old, New);
252 for (unsigned i = 0, e = Old->getNumValues(); i != e; ++i) {
253 LLVM_DEBUG(dbgs() << (i == 0 ? " with: " : " and: ");
254 New[i]->dump(&DAG));
255 if (UpdatedNodes)
256 UpdatedNodes->insert(New[i].getNode());
257 }
258 ReplacedNode(Old);
259 }
260
261 void ReplaceNodeWithValue(SDValue Old, SDValue New) {
262 LLVM_DEBUG(dbgs() << " ... replacing: "; Old->dump(&DAG);
263 dbgs() << " with: "; New->dump(&DAG));
264
265 DAG.ReplaceAllUsesOfValueWith(Old, New);
266 if (UpdatedNodes)
267 UpdatedNodes->insert(New.getNode());
268 ReplacedNode(Old.getNode());
269 }
270};
271
272} // end anonymous namespace
273
274// Helper function that generates an MMO that considers the alignment of the
275// stack, and the size of the stack object
277 MachineFunction &MF,
278 bool isObjectScalable) {
279 auto &MFI = MF.getFrameInfo();
280 int FI = cast<FrameIndexSDNode>(StackPtr)->getIndex();
282 LocationSize ObjectSize = isObjectScalable
284 : LocationSize::precise(MFI.getObjectSize(FI));
286 ObjectSize, MFI.getObjectAlign(FI));
287}
288
289/// Return a vector shuffle operation which
290/// performs the same shuffle in terms of order or result bytes, but on a type
291/// whose vector element type is narrower than the original shuffle type.
292/// e.g. <v4i32> <0, 1, 0, 1> -> v8i16 <0, 1, 2, 3, 0, 1, 2, 3>
293SDValue SelectionDAGLegalize::ShuffleWithNarrowerEltType(
294 EVT NVT, EVT VT, const SDLoc &dl, SDValue N1, SDValue N2,
295 ArrayRef<int> Mask) const {
296 unsigned NumMaskElts = VT.getVectorNumElements();
297 unsigned NumDestElts = NVT.getVectorNumElements();
298 unsigned NumEltsGrowth = NumDestElts / NumMaskElts;
299
300 assert(NumEltsGrowth && "Cannot promote to vector type with fewer elts!");
301
302 if (NumEltsGrowth == 1)
303 return DAG.getVectorShuffle(NVT, dl, N1, N2, Mask);
304
305 SmallVector<int, 8> NewMask;
306 for (unsigned i = 0; i != NumMaskElts; ++i) {
307 int Idx = Mask[i];
308 for (unsigned j = 0; j != NumEltsGrowth; ++j) {
309 if (Idx < 0)
310 NewMask.push_back(-1);
311 else
312 NewMask.push_back(Idx * NumEltsGrowth + j);
313 }
314 }
315 assert(NewMask.size() == NumDestElts && "Non-integer NumEltsGrowth?");
316 assert(TLI.isShuffleMaskLegal(NewMask, NVT) && "Shuffle not legal?");
317 return DAG.getVectorShuffle(NVT, dl, N1, N2, NewMask);
318}
319
320/// Expands the ConstantFP node to an integer constant or
321/// a load from the constant pool.
323SelectionDAGLegalize::ExpandConstantFP(ConstantFPSDNode *CFP, bool UseCP) {
324 bool Extend = false;
325 SDLoc dl(CFP);
326
327 // If a FP immediate is precise when represented as a float and if the
328 // target can do an extending load from float to double, we put it into
329 // the constant pool as a float, even if it's is statically typed as a
330 // double. This shrinks FP constants and canonicalizes them for targets where
331 // an FP extending load is the same cost as a normal load (such as on the x87
332 // fp stack or PPC FP unit).
333 EVT VT = CFP->getValueType(0);
334 ConstantFP *LLVMC = const_cast<ConstantFP*>(CFP->getConstantFPValue());
335 if (!UseCP) {
336 assert((VT == MVT::f64 || VT == MVT::f32) && "Invalid type expansion");
337 return DAG.getConstant(LLVMC->getValueAPF().bitcastToAPInt(), dl,
338 (VT == MVT::f64) ? MVT::i64 : MVT::i32);
339 }
340
341 APFloat APF = CFP->getValueAPF();
342 EVT OrigVT = VT;
343 EVT SVT = VT;
344
345 // We don't want to shrink SNaNs. Converting the SNaN back to its real type
346 // can cause it to be changed into a QNaN on some platforms (e.g. on SystemZ).
347 if (!APF.isSignaling()) {
348 while (SVT != MVT::f32 && SVT != MVT::f16 && SVT != MVT::bf16) {
349 SVT = (MVT::SimpleValueType)(SVT.getSimpleVT().SimpleTy - 1);
351 // Only do this if the target has a native EXTLOAD instruction from
352 // smaller type.
353 TLI.isLoadExtLegal(ISD::EXTLOAD, OrigVT, SVT) &&
354 TLI.ShouldShrinkFPConstant(OrigVT)) {
355 Type *SType = SVT.getTypeForEVT(*DAG.getContext());
357 Instruction::FPTrunc, LLVMC, SType, DAG.getDataLayout()));
358 VT = SVT;
359 Extend = true;
360 }
361 }
362 }
363
364 SDValue CPIdx =
365 DAG.getConstantPool(LLVMC, TLI.getPointerTy(DAG.getDataLayout()));
366 Align Alignment = cast<ConstantPoolSDNode>(CPIdx)->getAlign();
367 if (Extend) {
369 ISD::EXTLOAD, dl, OrigVT, DAG.getEntryNode(), CPIdx,
371 Alignment);
372 return Result;
373 }
374 SDValue Result = DAG.getLoad(
375 OrigVT, dl, DAG.getEntryNode(), CPIdx,
377 return Result;
378}
379
380/// Expands the Constant node to a load from the constant pool.
381SDValue SelectionDAGLegalize::ExpandConstant(ConstantSDNode *CP) {
382 SDLoc dl(CP);
383 EVT VT = CP->getValueType(0);
384 SDValue CPIdx = DAG.getConstantPool(CP->getConstantIntValue(),
385 TLI.getPointerTy(DAG.getDataLayout()));
386 Align Alignment = cast<ConstantPoolSDNode>(CPIdx)->getAlign();
387 SDValue Result = DAG.getLoad(
388 VT, dl, DAG.getEntryNode(), CPIdx,
390 return Result;
391}
392
393SDValue SelectionDAGLegalize::ExpandINSERT_VECTOR_ELT(SDValue Op) {
394 SDValue Vec = Op.getOperand(0);
395 SDValue Val = Op.getOperand(1);
396 SDValue Idx = Op.getOperand(2);
397 SDLoc dl(Op);
398
399 if (ConstantSDNode *InsertPos = dyn_cast<ConstantSDNode>(Idx)) {
400 // SCALAR_TO_VECTOR requires that the type of the value being inserted
401 // match the element type of the vector being created, except for
402 // integers in which case the inserted value can be over width.
403 EVT EltVT = Vec.getValueType().getVectorElementType();
404 if (Val.getValueType() == EltVT ||
405 (EltVT.isInteger() && Val.getValueType().bitsGE(EltVT))) {
406 SDValue ScVec = DAG.getNode(ISD::SCALAR_TO_VECTOR, dl,
407 Vec.getValueType(), Val);
408
409 unsigned NumElts = Vec.getValueType().getVectorNumElements();
410 // We generate a shuffle of InVec and ScVec, so the shuffle mask
411 // should be 0,1,2,3,4,5... with the appropriate element replaced with
412 // elt 0 of the RHS.
413 SmallVector<int, 8> ShufOps;
414 for (unsigned i = 0; i != NumElts; ++i)
415 ShufOps.push_back(i != InsertPos->getZExtValue() ? i : NumElts);
416
417 return DAG.getVectorShuffle(Vec.getValueType(), dl, Vec, ScVec, ShufOps);
418 }
419 }
420 return ExpandInsertToVectorThroughStack(Op);
421}
422
423SDValue SelectionDAGLegalize::OptimizeFloatStore(StoreSDNode* ST) {
424 if (!ISD::isNormalStore(ST))
425 return SDValue();
426
427 LLVM_DEBUG(dbgs() << "Optimizing float store operations\n");
428 // Turn 'store float 1.0, Ptr' -> 'store int 0x12345678, Ptr'
429 // FIXME: move this to the DAG Combiner! Note that we can't regress due
430 // to phase ordering between legalized code and the dag combiner. This
431 // probably means that we need to integrate dag combiner and legalizer
432 // together.
433 // We generally can't do this one for long doubles.
434 SDValue Chain = ST->getChain();
435 SDValue Ptr = ST->getBasePtr();
436 SDValue Value = ST->getValue();
437 MachineMemOperand::Flags MMOFlags = ST->getMemOperand()->getFlags();
438 AAMDNodes AAInfo = ST->getAAInfo();
439 SDLoc dl(ST);
440
441 // Don't optimise TargetConstantFP
442 if (Value.getOpcode() == ISD::TargetConstantFP)
443 return SDValue();
444
445 if (ConstantFPSDNode *CFP = dyn_cast<ConstantFPSDNode>(Value)) {
446 if (CFP->getValueType(0) == MVT::f32 &&
447 TLI.isTypeLegal(MVT::i32)) {
448 SDValue Con = DAG.getConstant(CFP->getValueAPF().
449 bitcastToAPInt().zextOrTrunc(32),
450 SDLoc(CFP), MVT::i32);
451 return DAG.getStore(Chain, dl, Con, Ptr, ST->getPointerInfo(),
452 ST->getBaseAlign(), MMOFlags, AAInfo);
453 }
454
455 if (CFP->getValueType(0) == MVT::f64 &&
456 !TLI.isFPImmLegal(CFP->getValueAPF(), MVT::f64)) {
457 // If this target supports 64-bit registers, do a single 64-bit store.
458 if (TLI.isTypeLegal(MVT::i64)) {
460 zextOrTrunc(64), SDLoc(CFP), MVT::i64);
461 return DAG.getStore(Chain, dl, Con, Ptr, ST->getPointerInfo(),
462 ST->getBaseAlign(), MMOFlags, AAInfo);
463 }
464
465 if (TLI.isTypeLegal(MVT::i32) && !ST->isVolatile()) {
466 // Otherwise, if the target supports 32-bit registers, use 2 32-bit
467 // stores. If the target supports neither 32- nor 64-bits, this
468 // xform is certainly not worth it.
469 const APInt &IntVal = CFP->getValueAPF().bitcastToAPInt();
470 SDValue Lo = DAG.getConstant(IntVal.trunc(32), dl, MVT::i32);
471 SDValue Hi = DAG.getConstant(IntVal.lshr(32).trunc(32), dl, MVT::i32);
472 if (DAG.getDataLayout().isBigEndian())
473 std::swap(Lo, Hi);
474
475 Lo = DAG.getStore(Chain, dl, Lo, Ptr, ST->getPointerInfo(),
476 ST->getBaseAlign(), MMOFlags, AAInfo);
477 Ptr = DAG.getMemBasePlusOffset(Ptr, TypeSize::getFixed(4), dl);
478 Hi = DAG.getStore(Chain, dl, Hi, Ptr,
479 ST->getPointerInfo().getWithOffset(4),
480 ST->getBaseAlign(), MMOFlags, AAInfo);
481
482 return DAG.getNode(ISD::TokenFactor, dl, MVT::Other, Lo, Hi);
483 }
484 }
485 }
486 return SDValue();
487}
488
489void SelectionDAGLegalize::LegalizeStoreOps(SDNode *Node) {
490 StoreSDNode *ST = cast<StoreSDNode>(Node);
491 SDValue Chain = ST->getChain();
492 SDValue Ptr = ST->getBasePtr();
493 SDLoc dl(Node);
494
495 MachineMemOperand::Flags MMOFlags = ST->getMemOperand()->getFlags();
496 AAMDNodes AAInfo = ST->getAAInfo();
497
498 if (!ST->isTruncatingStore()) {
499 LLVM_DEBUG(dbgs() << "Legalizing store operation\n");
500 if (SDNode *OptStore = OptimizeFloatStore(ST).getNode()) {
501 ReplaceNode(ST, OptStore);
502 return;
503 }
504
505 SDValue Value = ST->getValue();
506 MVT VT = Value.getSimpleValueType();
507 switch (TLI.getOperationAction(ISD::STORE, VT)) {
508 default: llvm_unreachable("This action is not supported yet!");
509 case TargetLowering::Legal: {
510 // If this is an unaligned store and the target doesn't support it,
511 // expand it.
512 EVT MemVT = ST->getMemoryVT();
513 const DataLayout &DL = DAG.getDataLayout();
514 if (!TLI.allowsMemoryAccessForAlignment(*DAG.getContext(), DL, MemVT,
515 *ST->getMemOperand())) {
516 LLVM_DEBUG(dbgs() << "Expanding unsupported unaligned store\n");
517 SDValue Result = TLI.expandUnalignedStore(ST, DAG);
518 ReplaceNode(SDValue(ST, 0), Result);
519 } else
520 LLVM_DEBUG(dbgs() << "Legal store\n");
521 break;
522 }
523 case TargetLowering::Custom: {
524 LLVM_DEBUG(dbgs() << "Trying custom lowering\n");
525 SDValue Res = TLI.LowerOperation(SDValue(Node, 0), DAG);
526 if (Res && Res != SDValue(Node, 0))
527 ReplaceNode(SDValue(Node, 0), Res);
528 return;
529 }
530 case TargetLowering::Promote: {
531 MVT NVT = TLI.getTypeToPromoteTo(ISD::STORE, VT);
532 assert(NVT.getSizeInBits() == VT.getSizeInBits() &&
533 "Can only promote stores to same size type");
534 Value = DAG.getNode(ISD::BITCAST, dl, NVT, Value);
535 SDValue Result = DAG.getStore(Chain, dl, Value, Ptr, ST->getPointerInfo(),
536 ST->getBaseAlign(), MMOFlags, AAInfo);
537 ReplaceNode(SDValue(Node, 0), Result);
538 break;
539 }
540 }
541 return;
542 }
543
544 LLVM_DEBUG(dbgs() << "Legalizing truncating store operations\n");
545 SDValue Value = ST->getValue();
546 EVT StVT = ST->getMemoryVT();
547 TypeSize StWidth = StVT.getSizeInBits();
548 TypeSize StSize = StVT.getStoreSizeInBits();
549 auto &DL = DAG.getDataLayout();
550
551 if (StWidth != StSize) {
552 // Promote to a byte-sized store with upper bits zero if not
553 // storing an integral number of bytes. For example, promote
554 // TRUNCSTORE:i1 X -> TRUNCSTORE:i8 (and X, 1)
555 EVT NVT = EVT::getIntegerVT(*DAG.getContext(), StSize.getFixedValue());
556 Value = DAG.getZeroExtendInReg(Value, dl, StVT);
558 DAG.getTruncStore(Chain, dl, Value, Ptr, ST->getPointerInfo(), NVT,
559 ST->getBaseAlign(), MMOFlags, AAInfo);
560 ReplaceNode(SDValue(Node, 0), Result);
561 } else if (!StVT.isVector() && !isPowerOf2_64(StWidth.getFixedValue())) {
562 // If not storing a power-of-2 number of bits, expand as two stores.
563 assert(!StVT.isVector() && "Unsupported truncstore!");
564 unsigned StWidthBits = StWidth.getFixedValue();
565 unsigned LogStWidth = Log2_32(StWidthBits);
566 assert(LogStWidth < 32);
567 unsigned RoundWidth = 1 << LogStWidth;
568 assert(RoundWidth < StWidthBits);
569 unsigned ExtraWidth = StWidthBits - RoundWidth;
570 assert(ExtraWidth < RoundWidth);
571 assert(!(RoundWidth % 8) && !(ExtraWidth % 8) &&
572 "Store size not an integral number of bytes!");
573 EVT RoundVT = EVT::getIntegerVT(*DAG.getContext(), RoundWidth);
574 EVT ExtraVT = EVT::getIntegerVT(*DAG.getContext(), ExtraWidth);
575 SDValue Lo, Hi;
576 unsigned IncrementSize;
577
578 if (DL.isLittleEndian()) {
579 // TRUNCSTORE:i24 X -> TRUNCSTORE:i16 X, TRUNCSTORE@+2:i8 (srl X, 16)
580 // Store the bottom RoundWidth bits.
581 Lo = DAG.getTruncStore(Chain, dl, Value, Ptr, ST->getPointerInfo(),
582 RoundVT, ST->getBaseAlign(), MMOFlags, AAInfo);
583
584 // Store the remaining ExtraWidth bits.
585 IncrementSize = RoundWidth / 8;
586 Ptr =
587 DAG.getMemBasePlusOffset(Ptr, TypeSize::getFixed(IncrementSize), dl);
588 Hi = DAG.getNode(
589 ISD::SRL, dl, Value.getValueType(), Value,
590 DAG.getShiftAmountConstant(RoundWidth, Value.getValueType(), dl));
591 Hi = DAG.getTruncStore(Chain, dl, Hi, Ptr,
592 ST->getPointerInfo().getWithOffset(IncrementSize),
593 ExtraVT, ST->getBaseAlign(), MMOFlags, AAInfo);
594 } else {
595 // Big endian - avoid unaligned stores.
596 // TRUNCSTORE:i24 X -> TRUNCSTORE:i16 (srl X, 8), TRUNCSTORE@+2:i8 X
597 // Store the top RoundWidth bits.
598 Hi = DAG.getNode(
599 ISD::SRL, dl, Value.getValueType(), Value,
600 DAG.getShiftAmountConstant(ExtraWidth, Value.getValueType(), dl));
601 Hi = DAG.getTruncStore(Chain, dl, Hi, Ptr, ST->getPointerInfo(), RoundVT,
602 ST->getBaseAlign(), MMOFlags, AAInfo);
603
604 // Store the remaining ExtraWidth bits.
605 IncrementSize = RoundWidth / 8;
606 Ptr = DAG.getNode(ISD::ADD, dl, Ptr.getValueType(), Ptr,
607 DAG.getConstant(IncrementSize, dl,
608 Ptr.getValueType()));
609 Lo = DAG.getTruncStore(Chain, dl, Value, Ptr,
610 ST->getPointerInfo().getWithOffset(IncrementSize),
611 ExtraVT, ST->getBaseAlign(), MMOFlags, AAInfo);
612 }
613
614 // The order of the stores doesn't matter.
615 SDValue Result = DAG.getNode(ISD::TokenFactor, dl, MVT::Other, Lo, Hi);
616 ReplaceNode(SDValue(Node, 0), Result);
617 } else {
618 switch (TLI.getTruncStoreAction(ST->getValue().getValueType(), StVT)) {
619 default: llvm_unreachable("This action is not supported yet!");
620 case TargetLowering::Legal: {
621 EVT MemVT = ST->getMemoryVT();
622 // If this is an unaligned store and the target doesn't support it,
623 // expand it.
624 if (!TLI.allowsMemoryAccessForAlignment(*DAG.getContext(), DL, MemVT,
625 *ST->getMemOperand())) {
626 SDValue Result = TLI.expandUnalignedStore(ST, DAG);
627 ReplaceNode(SDValue(ST, 0), Result);
628 }
629 break;
630 }
631 case TargetLowering::Custom: {
632 SDValue Res = TLI.LowerOperation(SDValue(Node, 0), DAG);
633 if (Res && Res != SDValue(Node, 0))
634 ReplaceNode(SDValue(Node, 0), Res);
635 return;
636 }
637 case TargetLowering::Expand:
638 assert(!StVT.isVector() &&
639 "Vector Stores are handled in LegalizeVectorOps");
640
642
643 // TRUNCSTORE:i16 i32 -> STORE i16
644 if (TLI.isTypeLegal(StVT)) {
645 Value = DAG.getNode(ISD::TRUNCATE, dl, StVT, Value);
646 Result = DAG.getStore(Chain, dl, Value, Ptr, ST->getPointerInfo(),
647 ST->getBaseAlign(), MMOFlags, AAInfo);
648 } else {
649 // The in-memory type isn't legal. Truncate to the type it would promote
650 // to, and then do a truncstore.
651 Value = DAG.getNode(ISD::TRUNCATE, dl,
652 TLI.getTypeToTransformTo(*DAG.getContext(), StVT),
653 Value);
654 Result = DAG.getTruncStore(Chain, dl, Value, Ptr, ST->getPointerInfo(),
655 StVT, ST->getBaseAlign(), MMOFlags, AAInfo);
656 }
657
658 ReplaceNode(SDValue(Node, 0), Result);
659 break;
660 }
661 }
662}
663
664void SelectionDAGLegalize::LegalizeLoadOps(SDNode *Node) {
665 LoadSDNode *LD = cast<LoadSDNode>(Node);
666 SDValue Chain = LD->getChain(); // The chain.
667 SDValue Ptr = LD->getBasePtr(); // The base pointer.
668 SDValue Value; // The value returned by the load op.
669 SDLoc dl(Node);
670
671 ISD::LoadExtType ExtType = LD->getExtensionType();
672 if (ExtType == ISD::NON_EXTLOAD) {
673 LLVM_DEBUG(dbgs() << "Legalizing non-extending load operation\n");
674 MVT VT = Node->getSimpleValueType(0);
675 SDValue RVal = SDValue(Node, 0);
676 SDValue RChain = SDValue(Node, 1);
677
678 switch (TLI.getOperationAction(Node->getOpcode(), VT)) {
679 default: llvm_unreachable("This action is not supported yet!");
680 case TargetLowering::Legal: {
681 EVT MemVT = LD->getMemoryVT();
682 const DataLayout &DL = DAG.getDataLayout();
683 // If this is an unaligned load and the target doesn't support it,
684 // expand it.
685 if (!TLI.allowsMemoryAccessForAlignment(*DAG.getContext(), DL, MemVT,
686 *LD->getMemOperand())) {
687 std::tie(RVal, RChain) = TLI.expandUnalignedLoad(LD, DAG);
688 }
689 break;
690 }
691 case TargetLowering::Custom:
692 if (SDValue Res = TLI.LowerOperation(RVal, DAG)) {
693 RVal = Res;
694 RChain = Res.getValue(1);
695 }
696 break;
697
698 case TargetLowering::Promote: {
699 MVT NVT = TLI.getTypeToPromoteTo(Node->getOpcode(), VT);
700 assert(NVT.getSizeInBits() == VT.getSizeInBits() &&
701 "Can only promote loads to same size type");
702
703 // If the range metadata type does not match the legalized memory
704 // operation type, remove the range metadata.
705 if (const MDNode *MD = LD->getRanges()) {
706 ConstantInt *Lower = mdconst::extract<ConstantInt>(MD->getOperand(0));
707 if (Lower->getBitWidth() != NVT.getScalarSizeInBits() ||
708 !NVT.isInteger())
709 LD->getMemOperand()->clearRanges();
710 }
711 SDValue Res = DAG.getLoad(NVT, dl, Chain, Ptr, LD->getMemOperand());
712 RVal = DAG.getNode(ISD::BITCAST, dl, VT, Res);
713 RChain = Res.getValue(1);
714 break;
715 }
716 }
717 if (RChain.getNode() != Node) {
718 assert(RVal.getNode() != Node && "Load must be completely replaced");
719 DAG.ReplaceAllUsesOfValueWith(SDValue(Node, 0), RVal);
720 DAG.ReplaceAllUsesOfValueWith(SDValue(Node, 1), RChain);
721 if (UpdatedNodes) {
722 UpdatedNodes->insert(RVal.getNode());
723 UpdatedNodes->insert(RChain.getNode());
724 }
725 ReplacedNode(Node);
726 }
727 return;
728 }
729
730 LLVM_DEBUG(dbgs() << "Legalizing extending load operation\n");
731 EVT SrcVT = LD->getMemoryVT();
732 TypeSize SrcWidth = SrcVT.getSizeInBits();
733 MachineMemOperand::Flags MMOFlags = LD->getMemOperand()->getFlags();
734 AAMDNodes AAInfo = LD->getAAInfo();
735
736 if (SrcWidth != SrcVT.getStoreSizeInBits() &&
737 // Some targets pretend to have an i1 loading operation, and actually
738 // load an i8. This trick is correct for ZEXTLOAD because the top 7
739 // bits are guaranteed to be zero; it helps the optimizers understand
740 // that these bits are zero. It is also useful for EXTLOAD, since it
741 // tells the optimizers that those bits are undefined. It would be
742 // nice to have an effective generic way of getting these benefits...
743 // Until such a way is found, don't insist on promoting i1 here.
744 (SrcVT != MVT::i1 ||
745 TLI.getLoadExtAction(ExtType, Node->getValueType(0), MVT::i1) ==
746 TargetLowering::Promote)) {
747 // Promote to a byte-sized load if not loading an integral number of
748 // bytes. For example, promote EXTLOAD:i20 -> EXTLOAD:i24.
749 unsigned NewWidth = SrcVT.getStoreSizeInBits();
750 EVT NVT = EVT::getIntegerVT(*DAG.getContext(), NewWidth);
751 SDValue Ch;
752
753 // The extra bits are guaranteed to be zero, since we stored them that
754 // way. A zext load from NVT thus automatically gives zext from SrcVT.
755
756 ISD::LoadExtType NewExtType =
758
759 SDValue Result = DAG.getExtLoad(NewExtType, dl, Node->getValueType(0),
760 Chain, Ptr, LD->getPointerInfo(), NVT,
761 LD->getBaseAlign(), MMOFlags, AAInfo);
762
763 Ch = Result.getValue(1); // The chain.
764
765 if (ExtType == ISD::SEXTLOAD)
766 // Having the top bits zero doesn't help when sign extending.
768 Result.getValueType(),
769 Result, DAG.getValueType(SrcVT));
770 else if (ExtType == ISD::ZEXTLOAD || NVT == Result.getValueType())
771 // All the top bits are guaranteed to be zero - inform the optimizers.
773 Result.getValueType(), Result,
774 DAG.getValueType(SrcVT));
775
776 Value = Result;
777 Chain = Ch;
778 } else if (!isPowerOf2_64(SrcWidth.getKnownMinValue())) {
779 // If not loading a power-of-2 number of bits, expand as two loads.
780 assert(!SrcVT.isVector() && "Unsupported extload!");
781 unsigned SrcWidthBits = SrcWidth.getFixedValue();
782 unsigned LogSrcWidth = Log2_32(SrcWidthBits);
783 assert(LogSrcWidth < 32);
784 unsigned RoundWidth = 1 << LogSrcWidth;
785 assert(RoundWidth < SrcWidthBits);
786 unsigned ExtraWidth = SrcWidthBits - RoundWidth;
787 assert(ExtraWidth < RoundWidth);
788 assert(!(RoundWidth % 8) && !(ExtraWidth % 8) &&
789 "Load size not an integral number of bytes!");
790 EVT RoundVT = EVT::getIntegerVT(*DAG.getContext(), RoundWidth);
791 EVT ExtraVT = EVT::getIntegerVT(*DAG.getContext(), ExtraWidth);
792 SDValue Lo, Hi, Ch;
793 unsigned IncrementSize;
794 auto &DL = DAG.getDataLayout();
795
796 if (DL.isLittleEndian()) {
797 // EXTLOAD:i24 -> ZEXTLOAD:i16 | (shl EXTLOAD@+2:i8, 16)
798 // Load the bottom RoundWidth bits.
799 Lo = DAG.getExtLoad(ISD::ZEXTLOAD, dl, Node->getValueType(0), Chain, Ptr,
800 LD->getPointerInfo(), RoundVT, LD->getBaseAlign(),
801 MMOFlags, AAInfo);
802
803 // Load the remaining ExtraWidth bits.
804 IncrementSize = RoundWidth / 8;
805 Ptr =
806 DAG.getMemBasePlusOffset(Ptr, TypeSize::getFixed(IncrementSize), dl);
807 Hi = DAG.getExtLoad(ExtType, dl, Node->getValueType(0), Chain, Ptr,
808 LD->getPointerInfo().getWithOffset(IncrementSize),
809 ExtraVT, LD->getBaseAlign(), MMOFlags, AAInfo);
810
811 // Build a factor node to remember that this load is independent of
812 // the other one.
813 Ch = DAG.getNode(ISD::TokenFactor, dl, MVT::Other, Lo.getValue(1),
814 Hi.getValue(1));
815
816 // Move the top bits to the right place.
817 Hi = DAG.getNode(
818 ISD::SHL, dl, Hi.getValueType(), Hi,
819 DAG.getShiftAmountConstant(RoundWidth, Hi.getValueType(), dl));
820
821 // Join the hi and lo parts.
822 Value = DAG.getNode(ISD::OR, dl, Node->getValueType(0), Lo, Hi);
823 } else {
824 // Big endian - avoid unaligned loads.
825 // EXTLOAD:i24 -> (shl EXTLOAD:i16, 8) | ZEXTLOAD@+2:i8
826 // Load the top RoundWidth bits.
827 Hi = DAG.getExtLoad(ExtType, dl, Node->getValueType(0), Chain, Ptr,
828 LD->getPointerInfo(), RoundVT, LD->getBaseAlign(),
829 MMOFlags, AAInfo);
830
831 // Load the remaining ExtraWidth bits.
832 IncrementSize = RoundWidth / 8;
833 Ptr =
834 DAG.getMemBasePlusOffset(Ptr, TypeSize::getFixed(IncrementSize), dl);
835 Lo = DAG.getExtLoad(ISD::ZEXTLOAD, dl, Node->getValueType(0), Chain, Ptr,
836 LD->getPointerInfo().getWithOffset(IncrementSize),
837 ExtraVT, LD->getBaseAlign(), MMOFlags, AAInfo);
838
839 // Build a factor node to remember that this load is independent of
840 // the other one.
841 Ch = DAG.getNode(ISD::TokenFactor, dl, MVT::Other, Lo.getValue(1),
842 Hi.getValue(1));
843
844 // Move the top bits to the right place.
845 Hi = DAG.getNode(
846 ISD::SHL, dl, Hi.getValueType(), Hi,
847 DAG.getShiftAmountConstant(ExtraWidth, Hi.getValueType(), dl));
848
849 // Join the hi and lo parts.
850 Value = DAG.getNode(ISD::OR, dl, Node->getValueType(0), Lo, Hi);
851 }
852
853 Chain = Ch;
854 } else {
855 bool isCustom = false;
856 switch (TLI.getLoadExtAction(ExtType, Node->getValueType(0),
857 SrcVT.getSimpleVT())) {
858 default: llvm_unreachable("This action is not supported yet!");
859 case TargetLowering::Custom:
860 isCustom = true;
861 [[fallthrough]];
862 case TargetLowering::Legal:
863 Value = SDValue(Node, 0);
864 Chain = SDValue(Node, 1);
865
866 if (isCustom) {
867 if (SDValue Res = TLI.LowerOperation(SDValue(Node, 0), DAG)) {
868 Value = Res;
869 Chain = Res.getValue(1);
870 }
871 } else {
872 // If this is an unaligned load and the target doesn't support it,
873 // expand it.
874 EVT MemVT = LD->getMemoryVT();
875 const DataLayout &DL = DAG.getDataLayout();
876 if (!TLI.allowsMemoryAccess(*DAG.getContext(), DL, MemVT,
877 *LD->getMemOperand())) {
878 std::tie(Value, Chain) = TLI.expandUnalignedLoad(LD, DAG);
879 }
880 }
881 break;
882
883 case TargetLowering::Expand: {
884 EVT DestVT = Node->getValueType(0);
885 if (!TLI.isLoadExtLegal(ISD::EXTLOAD, DestVT, SrcVT)) {
886 // If the source type is not legal, see if there is a legal extload to
887 // an intermediate type that we can then extend further.
888 EVT LoadVT = TLI.getRegisterType(SrcVT.getSimpleVT());
889 if ((LoadVT.isFloatingPoint() == SrcVT.isFloatingPoint()) &&
890 (TLI.isTypeLegal(SrcVT) || // Same as SrcVT == LoadVT?
891 TLI.isLoadExtLegal(ExtType, LoadVT, SrcVT))) {
892 // If we are loading a legal type, this is a non-extload followed by a
893 // full extend.
894 ISD::LoadExtType MidExtType =
895 (LoadVT == SrcVT) ? ISD::NON_EXTLOAD : ExtType;
896
897 SDValue Load = DAG.getExtLoad(MidExtType, dl, LoadVT, Chain, Ptr,
898 SrcVT, LD->getMemOperand());
899 unsigned ExtendOp =
901 Value = DAG.getNode(ExtendOp, dl, Node->getValueType(0), Load);
902 Chain = Load.getValue(1);
903 break;
904 }
905
906 // Handle the special case of fp16 extloads. EXTLOAD doesn't have the
907 // normal undefined upper bits behavior to allow using an in-reg extend
908 // with the illegal FP type, so load as an integer and do the
909 // from-integer conversion.
910 EVT SVT = SrcVT.getScalarType();
911 if (SVT == MVT::f16 || SVT == MVT::bf16) {
912 EVT ISrcVT = SrcVT.changeTypeToInteger();
913 EVT IDestVT = DestVT.changeTypeToInteger();
914 EVT ILoadVT = TLI.getRegisterType(IDestVT.getSimpleVT());
915
916 SDValue Result = DAG.getExtLoad(ISD::ZEXTLOAD, dl, ILoadVT, Chain,
917 Ptr, ISrcVT, LD->getMemOperand());
918 Value =
919 DAG.getNode(SVT == MVT::f16 ? ISD::FP16_TO_FP : ISD::BF16_TO_FP,
920 dl, DestVT, Result);
921 Chain = Result.getValue(1);
922 break;
923 }
924 }
925
926 assert(!SrcVT.isVector() &&
927 "Vector Loads are handled in LegalizeVectorOps");
928
929 // FIXME: This does not work for vectors on most targets. Sign-
930 // and zero-extend operations are currently folded into extending
931 // loads, whether they are legal or not, and then we end up here
932 // without any support for legalizing them.
933 assert(ExtType != ISD::EXTLOAD &&
934 "EXTLOAD should always be supported!");
935 // Turn the unsupported load into an EXTLOAD followed by an
936 // explicit zero/sign extend inreg.
938 Node->getValueType(0),
939 Chain, Ptr, SrcVT,
940 LD->getMemOperand());
941 SDValue ValRes;
942 if (ExtType == ISD::SEXTLOAD)
943 ValRes = DAG.getNode(ISD::SIGN_EXTEND_INREG, dl,
944 Result.getValueType(),
945 Result, DAG.getValueType(SrcVT));
946 else
947 ValRes = DAG.getZeroExtendInReg(Result, dl, SrcVT);
948 Value = ValRes;
949 Chain = Result.getValue(1);
950 break;
951 }
952 }
953 }
954
955 // Since loads produce two values, make sure to remember that we legalized
956 // both of them.
957 if (Chain.getNode() != Node) {
958 assert(Value.getNode() != Node && "Load must be completely replaced");
960 DAG.ReplaceAllUsesOfValueWith(SDValue(Node, 1), Chain);
961 if (UpdatedNodes) {
962 UpdatedNodes->insert(Value.getNode());
963 UpdatedNodes->insert(Chain.getNode());
964 }
965 ReplacedNode(Node);
966 }
967}
968
969/// Return a legal replacement for the given operation, with all legal operands.
970void SelectionDAGLegalize::LegalizeOp(SDNode *Node) {
971 LLVM_DEBUG(dbgs() << "\nLegalizing: "; Node->dump(&DAG));
972
973 // Allow illegal target nodes and illegal registers.
974 if (Node->getOpcode() == ISD::TargetConstant ||
975 Node->getOpcode() == ISD::Register)
976 return;
977
978#ifndef NDEBUG
979 for (unsigned i = 0, e = Node->getNumValues(); i != e; ++i)
980 assert(TLI.getTypeAction(*DAG.getContext(), Node->getValueType(i)) ==
981 TargetLowering::TypeLegal &&
982 "Unexpected illegal type!");
983
984 for (const SDValue &Op : Node->op_values())
985 assert((TLI.getTypeAction(*DAG.getContext(), Op.getValueType()) ==
986 TargetLowering::TypeLegal ||
987 Op.getOpcode() == ISD::TargetConstant ||
988 Op.getOpcode() == ISD::Register) &&
989 "Unexpected illegal type!");
990#endif
991
992 // Figure out the correct action; the way to query this varies by opcode
993 TargetLowering::LegalizeAction Action = TargetLowering::Legal;
994 bool SimpleFinishLegalizing = true;
995 switch (Node->getOpcode()) {
996 case ISD::POISON: {
997 // TODO: Currently, POISON is being lowered to UNDEF here. However, there is
998 // an open concern that this transformation may not be ideal, as targets
999 // should ideally handle POISON directly. Changing this behavior would
1000 // require adding support for POISON in TableGen, which is a large change.
1001 // Additionally, many existing test cases rely on the current behavior
1002 // (e.g., llvm/test/CodeGen/PowerPC/vec_shuffle.ll). A broader discussion
1003 // and incremental changes might be needed to properly support POISON
1004 // without breaking existing targets and tests.
1005 SDValue UndefNode = DAG.getUNDEF(Node->getValueType(0));
1006 ReplaceNode(Node, UndefNode.getNode());
1007 return;
1008 }
1012 case ISD::STACKSAVE:
1013 Action = TLI.getOperationAction(Node->getOpcode(), MVT::Other);
1014 break;
1016 Action = TLI.getOperationAction(Node->getOpcode(),
1017 Node->getValueType(0));
1018 break;
1019 case ISD::VAARG:
1020 Action = TLI.getOperationAction(Node->getOpcode(),
1021 Node->getValueType(0));
1022 if (Action != TargetLowering::Promote)
1023 Action = TLI.getOperationAction(Node->getOpcode(), MVT::Other);
1024 break;
1025 case ISD::SET_FPENV:
1026 case ISD::SET_FPMODE:
1027 Action = TLI.getOperationAction(Node->getOpcode(),
1028 Node->getOperand(1).getValueType());
1029 break;
1030 case ISD::FP_TO_FP16:
1031 case ISD::FP_TO_BF16:
1032 case ISD::SINT_TO_FP:
1033 case ISD::UINT_TO_FP:
1035 case ISD::LROUND:
1036 case ISD::LLROUND:
1037 case ISD::LRINT:
1038 case ISD::LLRINT:
1039 Action = TLI.getOperationAction(Node->getOpcode(),
1040 Node->getOperand(0).getValueType());
1041 break;
1046 case ISD::STRICT_LRINT:
1047 case ISD::STRICT_LLRINT:
1048 case ISD::STRICT_LROUND:
1050 // These pseudo-ops are the same as the other STRICT_ ops except
1051 // they are registered with setOperationAction() using the input type
1052 // instead of the output type.
1053 Action = TLI.getOperationAction(Node->getOpcode(),
1054 Node->getOperand(1).getValueType());
1055 break;
1057 EVT InnerType = cast<VTSDNode>(Node->getOperand(1))->getVT();
1058 Action = TLI.getOperationAction(Node->getOpcode(), InnerType);
1059 break;
1060 }
1061 case ISD::ATOMIC_STORE:
1062 Action = TLI.getOperationAction(Node->getOpcode(),
1063 Node->getOperand(1).getValueType());
1064 break;
1065 case ISD::SELECT_CC:
1066 case ISD::STRICT_FSETCC:
1068 case ISD::SETCC:
1069 case ISD::SETCCCARRY:
1070 case ISD::VP_SETCC:
1071 case ISD::BR_CC: {
1072 unsigned Opc = Node->getOpcode();
1073 unsigned CCOperand = Opc == ISD::SELECT_CC ? 4
1074 : Opc == ISD::STRICT_FSETCC ? 3
1075 : Opc == ISD::STRICT_FSETCCS ? 3
1076 : Opc == ISD::SETCCCARRY ? 3
1077 : (Opc == ISD::SETCC || Opc == ISD::VP_SETCC) ? 2
1078 : 1;
1079 unsigned CompareOperand = Opc == ISD::BR_CC ? 2
1080 : Opc == ISD::STRICT_FSETCC ? 1
1081 : Opc == ISD::STRICT_FSETCCS ? 1
1082 : 0;
1083 MVT OpVT = Node->getOperand(CompareOperand).getSimpleValueType();
1084 ISD::CondCode CCCode =
1085 cast<CondCodeSDNode>(Node->getOperand(CCOperand))->get();
1086 Action = TLI.getCondCodeAction(CCCode, OpVT);
1087 if (Action == TargetLowering::Legal) {
1088 if (Node->getOpcode() == ISD::SELECT_CC)
1089 Action = TLI.getOperationAction(Node->getOpcode(),
1090 Node->getValueType(0));
1091 else
1092 Action = TLI.getOperationAction(Node->getOpcode(), OpVT);
1093 }
1094 break;
1095 }
1096 case ISD::LOAD:
1097 case ISD::STORE:
1098 // FIXME: Model these properly. LOAD and STORE are complicated, and
1099 // STORE expects the unlegalized operand in some cases.
1100 SimpleFinishLegalizing = false;
1101 break;
1102 case ISD::CALLSEQ_START:
1103 case ISD::CALLSEQ_END:
1104 // FIXME: This shouldn't be necessary. These nodes have special properties
1105 // dealing with the recursive nature of legalization. Removing this
1106 // special case should be done as part of making LegalizeDAG non-recursive.
1107 SimpleFinishLegalizing = false;
1108 break;
1110 case ISD::GET_ROUNDING:
1111 case ISD::MERGE_VALUES:
1112 case ISD::EH_RETURN:
1114 case ISD::EH_DWARF_CFA:
1118 // These operations lie about being legal: when they claim to be legal,
1119 // they should actually be expanded.
1120 Action = TLI.getOperationAction(Node->getOpcode(), Node->getValueType(0));
1121 if (Action == TargetLowering::Legal)
1122 Action = TargetLowering::Expand;
1123 break;
1126 case ISD::FRAMEADDR:
1127 case ISD::RETURNADDR:
1129 case ISD::SPONENTRY:
1130 // These operations lie about being legal: when they claim to be legal,
1131 // they should actually be custom-lowered.
1132 Action = TLI.getOperationAction(Node->getOpcode(), Node->getValueType(0));
1133 if (Action == TargetLowering::Legal)
1134 Action = TargetLowering::Custom;
1135 break;
1136 case ISD::CLEAR_CACHE:
1137 // This operation is typically going to be LibCall unless the target wants
1138 // something differrent.
1139 Action = TLI.getOperationAction(Node->getOpcode(), Node->getValueType(0));
1140 break;
1143 // READCYCLECOUNTER and READSTEADYCOUNTER return a i64, even if type
1144 // legalization might have expanded that to several smaller types.
1145 Action = TLI.getOperationAction(Node->getOpcode(), MVT::i64);
1146 break;
1147 case ISD::READ_REGISTER:
1149 // Named register is legal in the DAG, but blocked by register name
1150 // selection if not implemented by target (to chose the correct register)
1151 // They'll be converted to Copy(To/From)Reg.
1152 Action = TargetLowering::Legal;
1153 break;
1154 case ISD::UBSANTRAP:
1155 Action = TLI.getOperationAction(Node->getOpcode(), Node->getValueType(0));
1156 if (Action == TargetLowering::Expand) {
1157 // replace ISD::UBSANTRAP with ISD::TRAP
1158 SDValue NewVal;
1159 NewVal = DAG.getNode(ISD::TRAP, SDLoc(Node), Node->getVTList(),
1160 Node->getOperand(0));
1161 ReplaceNode(Node, NewVal.getNode());
1162 LegalizeOp(NewVal.getNode());
1163 return;
1164 }
1165 break;
1166 case ISD::DEBUGTRAP:
1167 Action = TLI.getOperationAction(Node->getOpcode(), Node->getValueType(0));
1168 if (Action == TargetLowering::Expand) {
1169 // replace ISD::DEBUGTRAP with ISD::TRAP
1170 SDValue NewVal;
1171 NewVal = DAG.getNode(ISD::TRAP, SDLoc(Node), Node->getVTList(),
1172 Node->getOperand(0));
1173 ReplaceNode(Node, NewVal.getNode());
1174 LegalizeOp(NewVal.getNode());
1175 return;
1176 }
1177 break;
1178 case ISD::SADDSAT:
1179 case ISD::UADDSAT:
1180 case ISD::SSUBSAT:
1181 case ISD::USUBSAT:
1182 case ISD::SSHLSAT:
1183 case ISD::USHLSAT:
1184 case ISD::SCMP:
1185 case ISD::UCMP:
1188 Action = TLI.getOperationAction(Node->getOpcode(), Node->getValueType(0));
1189 break;
1190 case ISD::SMULFIX:
1191 case ISD::SMULFIXSAT:
1192 case ISD::UMULFIX:
1193 case ISD::UMULFIXSAT:
1194 case ISD::SDIVFIX:
1195 case ISD::SDIVFIXSAT:
1196 case ISD::UDIVFIX:
1197 case ISD::UDIVFIXSAT: {
1198 unsigned Scale = Node->getConstantOperandVal(2);
1199 Action = TLI.getFixedPointOperationAction(Node->getOpcode(),
1200 Node->getValueType(0), Scale);
1201 break;
1202 }
1203 case ISD::MSCATTER:
1204 Action = TLI.getOperationAction(Node->getOpcode(),
1205 cast<MaskedScatterSDNode>(Node)->getValue().getValueType());
1206 break;
1207 case ISD::MSTORE:
1208 Action = TLI.getOperationAction(Node->getOpcode(),
1209 cast<MaskedStoreSDNode>(Node)->getValue().getValueType());
1210 break;
1211 case ISD::VP_SCATTER:
1212 Action = TLI.getOperationAction(
1213 Node->getOpcode(),
1214 cast<VPScatterSDNode>(Node)->getValue().getValueType());
1215 break;
1216 case ISD::VP_STORE:
1217 Action = TLI.getOperationAction(
1218 Node->getOpcode(),
1219 cast<VPStoreSDNode>(Node)->getValue().getValueType());
1220 break;
1221 case ISD::EXPERIMENTAL_VP_STRIDED_STORE:
1222 Action = TLI.getOperationAction(
1223 Node->getOpcode(),
1224 cast<VPStridedStoreSDNode>(Node)->getValue().getValueType());
1225 break;
1228 case ISD::VECREDUCE_ADD:
1229 case ISD::VECREDUCE_MUL:
1230 case ISD::VECREDUCE_AND:
1231 case ISD::VECREDUCE_OR:
1232 case ISD::VECREDUCE_XOR:
1241 case ISD::IS_FPCLASS:
1242 Action = TLI.getOperationAction(
1243 Node->getOpcode(), Node->getOperand(0).getValueType());
1244 break;
1247 case ISD::VP_REDUCE_FADD:
1248 case ISD::VP_REDUCE_FMUL:
1249 case ISD::VP_REDUCE_ADD:
1250 case ISD::VP_REDUCE_MUL:
1251 case ISD::VP_REDUCE_AND:
1252 case ISD::VP_REDUCE_OR:
1253 case ISD::VP_REDUCE_XOR:
1254 case ISD::VP_REDUCE_SMAX:
1255 case ISD::VP_REDUCE_SMIN:
1256 case ISD::VP_REDUCE_UMAX:
1257 case ISD::VP_REDUCE_UMIN:
1258 case ISD::VP_REDUCE_FMAX:
1259 case ISD::VP_REDUCE_FMIN:
1260 case ISD::VP_REDUCE_FMAXIMUM:
1261 case ISD::VP_REDUCE_FMINIMUM:
1262 case ISD::VP_REDUCE_SEQ_FADD:
1263 case ISD::VP_REDUCE_SEQ_FMUL:
1264 Action = TLI.getOperationAction(
1265 Node->getOpcode(), Node->getOperand(1).getValueType());
1266 break;
1267 case ISD::VP_CTTZ_ELTS:
1268 case ISD::VP_CTTZ_ELTS_ZERO_UNDEF:
1269 Action = TLI.getOperationAction(Node->getOpcode(),
1270 Node->getOperand(0).getValueType());
1271 break;
1273 Action = TLI.getOperationAction(
1274 Node->getOpcode(),
1275 cast<MaskedHistogramSDNode>(Node)->getIndex().getValueType());
1276 break;
1277 default:
1278 if (Node->getOpcode() >= ISD::BUILTIN_OP_END) {
1279 Action = TLI.getCustomOperationAction(*Node);
1280 } else {
1281 Action = TLI.getOperationAction(Node->getOpcode(), Node->getValueType(0));
1282 }
1283 break;
1284 }
1285
1286 if (SimpleFinishLegalizing) {
1287 SDNode *NewNode = Node;
1288 switch (Node->getOpcode()) {
1289 default: break;
1290 case ISD::SHL:
1291 case ISD::SRL:
1292 case ISD::SRA:
1293 case ISD::ROTL:
1294 case ISD::ROTR:
1295 case ISD::SSHLSAT:
1296 case ISD::USHLSAT: {
1297 // Legalizing shifts/rotates requires adjusting the shift amount
1298 // to the appropriate width.
1299 SDValue Op0 = Node->getOperand(0);
1300 SDValue Op1 = Node->getOperand(1);
1301 if (!Op1.getValueType().isVector()) {
1302 SDValue SAO = DAG.getShiftAmountOperand(Op0.getValueType(), Op1);
1303 // The getShiftAmountOperand() may create a new operand node or
1304 // return the existing one. If new operand is created we need
1305 // to update the parent node.
1306 // Do not try to legalize SAO here! It will be automatically legalized
1307 // in the next round.
1308 if (SAO != Op1)
1309 NewNode = DAG.UpdateNodeOperands(Node, Op0, SAO);
1310 }
1311 break;
1312 }
1313 case ISD::FSHL:
1314 case ISD::FSHR:
1315 case ISD::SRL_PARTS:
1316 case ISD::SRA_PARTS:
1317 case ISD::SHL_PARTS: {
1318 // Legalizing shifts/rotates requires adjusting the shift amount
1319 // to the appropriate width.
1320 SDValue Op0 = Node->getOperand(0);
1321 SDValue Op1 = Node->getOperand(1);
1322 SDValue Op2 = Node->getOperand(2);
1323 if (!Op2.getValueType().isVector()) {
1324 SDValue SAO = DAG.getShiftAmountOperand(Op0.getValueType(), Op2);
1325 // The getShiftAmountOperand() may create a new operand node or
1326 // return the existing one. If new operand is created we need
1327 // to update the parent node.
1328 if (SAO != Op2)
1329 NewNode = DAG.UpdateNodeOperands(Node, Op0, Op1, SAO);
1330 }
1331 break;
1332 }
1333 }
1334
1335 if (NewNode != Node) {
1336 ReplaceNode(Node, NewNode);
1337 Node = NewNode;
1338 }
1339 switch (Action) {
1340 case TargetLowering::Legal:
1341 LLVM_DEBUG(dbgs() << "Legal node: nothing to do\n");
1342 return;
1343 case TargetLowering::Custom:
1344 LLVM_DEBUG(dbgs() << "Trying custom legalization\n");
1345 // FIXME: The handling for custom lowering with multiple results is
1346 // a complete mess.
1347 if (SDValue Res = TLI.LowerOperation(SDValue(Node, 0), DAG)) {
1348 if (!(Res.getNode() != Node || Res.getResNo() != 0))
1349 return;
1350
1351 if (Node->getNumValues() == 1) {
1352 // Verify the new types match the original. Glue is waived because
1353 // ISD::ADDC can be legalized by replacing Glue with an integer type.
1354 assert((Res.getValueType() == Node->getValueType(0) ||
1355 Node->getValueType(0) == MVT::Glue) &&
1356 "Type mismatch for custom legalized operation");
1357 LLVM_DEBUG(dbgs() << "Successfully custom legalized node\n");
1358 // We can just directly replace this node with the lowered value.
1359 ReplaceNode(SDValue(Node, 0), Res);
1360 return;
1361 }
1362
1363 SmallVector<SDValue, 8> ResultVals;
1364 for (unsigned i = 0, e = Node->getNumValues(); i != e; ++i) {
1365 // Verify the new types match the original. Glue is waived because
1366 // ISD::ADDC can be legalized by replacing Glue with an integer type.
1367 assert((Res->getValueType(i) == Node->getValueType(i) ||
1368 Node->getValueType(i) == MVT::Glue) &&
1369 "Type mismatch for custom legalized operation");
1370 ResultVals.push_back(Res.getValue(i));
1371 }
1372 LLVM_DEBUG(dbgs() << "Successfully custom legalized node\n");
1373 ReplaceNode(Node, ResultVals.data());
1374 return;
1375 }
1376 LLVM_DEBUG(dbgs() << "Could not custom legalize node\n");
1377 [[fallthrough]];
1378 case TargetLowering::Expand:
1379 if (ExpandNode(Node))
1380 return;
1381 [[fallthrough]];
1382 case TargetLowering::LibCall:
1383 ConvertNodeToLibcall(Node);
1384 return;
1385 case TargetLowering::Promote:
1386 PromoteNode(Node);
1387 return;
1388 }
1389 }
1390
1391 switch (Node->getOpcode()) {
1392 default:
1393#ifndef NDEBUG
1394 dbgs() << "NODE: ";
1395 Node->dump( &DAG);
1396 dbgs() << "\n";
1397#endif
1398 llvm_unreachable("Do not know how to legalize this operator!");
1399
1400 case ISD::CALLSEQ_START:
1401 case ISD::CALLSEQ_END:
1402 break;
1403 case ISD::LOAD:
1404 return LegalizeLoadOps(Node);
1405 case ISD::STORE:
1406 return LegalizeStoreOps(Node);
1407 }
1408}
1409
1410SDValue SelectionDAGLegalize::ExpandExtractFromVectorThroughStack(SDValue Op) {
1411 SDValue Vec = Op.getOperand(0);
1412 SDValue Idx = Op.getOperand(1);
1413 SDLoc dl(Op);
1414
1415 // Before we generate a new store to a temporary stack slot, see if there is
1416 // already one that we can use. There often is because when we scalarize
1417 // vector operations (using SelectionDAG::UnrollVectorOp for example) a whole
1418 // series of EXTRACT_VECTOR_ELT nodes are generated, one for each element in
1419 // the vector. If all are expanded here, we don't want one store per vector
1420 // element.
1421
1422 // Caches for hasPredecessorHelper
1423 SmallPtrSet<const SDNode *, 32> Visited;
1425 Visited.insert(Op.getNode());
1426 Worklist.push_back(Idx.getNode());
1427 SDValue StackPtr, Ch;
1428 for (SDNode *User : Vec.getNode()->users()) {
1429 if (StoreSDNode *ST = dyn_cast<StoreSDNode>(User)) {
1430 if (ST->isIndexed() || ST->isTruncatingStore() ||
1431 ST->getValue() != Vec)
1432 continue;
1433
1434 // Make sure that nothing else could have stored into the destination of
1435 // this store.
1436 if (!ST->getChain().reachesChainWithoutSideEffects(DAG.getEntryNode()))
1437 continue;
1438
1439 // If the index is dependent on the store we will introduce a cycle when
1440 // creating the load (the load uses the index, and by replacing the chain
1441 // we will make the index dependent on the load). Also, the store might be
1442 // dependent on the extractelement and introduce a cycle when creating
1443 // the load.
1444 if (SDNode::hasPredecessorHelper(ST, Visited, Worklist) ||
1445 ST->hasPredecessor(Op.getNode()))
1446 continue;
1447
1448 StackPtr = ST->getBasePtr();
1449 Ch = SDValue(ST, 0);
1450 break;
1451 }
1452 }
1453
1454 EVT VecVT = Vec.getValueType();
1455
1456 if (!Ch.getNode()) {
1457 // Store the value to a temporary stack slot, then LOAD the returned part.
1458 StackPtr = DAG.CreateStackTemporary(VecVT);
1459 MachineMemOperand *StoreMMO = getStackAlignedMMO(
1460 StackPtr, DAG.getMachineFunction(), VecVT.isScalableVector());
1461 Ch = DAG.getStore(DAG.getEntryNode(), dl, Vec, StackPtr, StoreMMO);
1462 }
1463
1464 SDValue NewLoad;
1465 Align ElementAlignment =
1466 std::min(cast<StoreSDNode>(Ch)->getAlign(),
1468 Op.getValueType().getTypeForEVT(*DAG.getContext())));
1469
1470 if (Op.getValueType().isVector()) {
1471 StackPtr = TLI.getVectorSubVecPointer(DAG, StackPtr, VecVT,
1472 Op.getValueType(), Idx);
1473 NewLoad = DAG.getLoad(Op.getValueType(), dl, Ch, StackPtr,
1474 MachinePointerInfo(), ElementAlignment);
1475 } else {
1476 StackPtr = TLI.getVectorElementPointer(DAG, StackPtr, VecVT, Idx);
1477 NewLoad = DAG.getExtLoad(ISD::EXTLOAD, dl, Op.getValueType(), Ch, StackPtr,
1478 MachinePointerInfo(), VecVT.getVectorElementType(),
1479 ElementAlignment);
1480 }
1481
1482 // Replace the chain going out of the store, by the one out of the load.
1483 DAG.ReplaceAllUsesOfValueWith(Ch, SDValue(NewLoad.getNode(), 1));
1484
1485 // We introduced a cycle though, so update the loads operands, making sure
1486 // to use the original store's chain as an incoming chain.
1487 SmallVector<SDValue, 6> NewLoadOperands(NewLoad->ops());
1488 NewLoadOperands[0] = Ch;
1489 NewLoad =
1490 SDValue(DAG.UpdateNodeOperands(NewLoad.getNode(), NewLoadOperands), 0);
1491 return NewLoad;
1492}
1493
1494SDValue SelectionDAGLegalize::ExpandInsertToVectorThroughStack(SDValue Op) {
1495 assert(Op.getValueType().isVector() && "Non-vector insert subvector!");
1496
1497 SDValue Vec = Op.getOperand(0);
1498 SDValue Part = Op.getOperand(1);
1499 SDValue Idx = Op.getOperand(2);
1500 SDLoc dl(Op);
1501
1502 // Store the value to a temporary stack slot, then LOAD the returned part.
1503 EVT VecVT = Vec.getValueType();
1504 EVT PartVT = Part.getValueType();
1506 int FI = cast<FrameIndexSDNode>(StackPtr.getNode())->getIndex();
1507 MachinePointerInfo PtrInfo =
1509
1510 // First store the whole vector.
1511 Align BaseVecAlignment =
1513 SDValue Ch = DAG.getStore(DAG.getEntryNode(), dl, Vec, StackPtr, PtrInfo,
1514 BaseVecAlignment);
1515
1516 // Freeze the index so we don't poison the clamping code we're about to emit.
1517 Idx = DAG.getFreeze(Idx);
1518
1519 Type *PartTy = PartVT.getTypeForEVT(*DAG.getContext());
1520 Align PartAlignment = DAG.getDataLayout().getPrefTypeAlign(PartTy);
1521
1522 // Then store the inserted part.
1523 if (PartVT.isVector()) {
1524 SDValue SubStackPtr =
1525 TLI.getVectorSubVecPointer(DAG, StackPtr, VecVT, PartVT, Idx);
1526
1527 // Store the subvector.
1528 Ch = DAG.getStore(
1529 Ch, dl, Part, SubStackPtr,
1531 PartAlignment);
1532 } else {
1533 SDValue SubStackPtr =
1534 TLI.getVectorElementPointer(DAG, StackPtr, VecVT, Idx);
1535
1536 // Store the scalar value.
1537 Ch = DAG.getTruncStore(
1538 Ch, dl, Part, SubStackPtr,
1540 VecVT.getVectorElementType(), PartAlignment);
1541 }
1542
1543 assert(cast<StoreSDNode>(Ch)->getAlign() == PartAlignment &&
1544 "ElementAlignment does not match!");
1545
1546 // Finally, load the updated vector.
1547 return DAG.getLoad(Op.getValueType(), dl, Ch, StackPtr, PtrInfo,
1548 BaseVecAlignment);
1549}
1550
1551SDValue SelectionDAGLegalize::ExpandConcatVectors(SDNode *Node) {
1552 assert(Node->getOpcode() == ISD::CONCAT_VECTORS && "Unexpected opcode!");
1553 SDLoc DL(Node);
1555 unsigned NumOperands = Node->getNumOperands();
1556 MVT VectorIdxType = TLI.getVectorIdxTy(DAG.getDataLayout());
1557 EVT VectorValueType = Node->getOperand(0).getValueType();
1558 unsigned NumSubElem = VectorValueType.getVectorNumElements();
1559 EVT ElementValueType = TLI.getTypeToTransformTo(
1560 *DAG.getContext(), VectorValueType.getVectorElementType());
1561 for (unsigned I = 0; I < NumOperands; ++I) {
1562 SDValue SubOp = Node->getOperand(I);
1563 for (unsigned Idx = 0; Idx < NumSubElem; ++Idx) {
1564 Ops.push_back(DAG.getNode(ISD::EXTRACT_VECTOR_ELT, DL, ElementValueType,
1565 SubOp,
1566 DAG.getConstant(Idx, DL, VectorIdxType)));
1567 }
1568 }
1569 return DAG.getBuildVector(Node->getValueType(0), DL, Ops);
1570}
1571
1572SDValue SelectionDAGLegalize::ExpandVectorBuildThroughStack(SDNode* Node) {
1573 assert((Node->getOpcode() == ISD::BUILD_VECTOR ||
1574 Node->getOpcode() == ISD::CONCAT_VECTORS) &&
1575 "Unexpected opcode!");
1576
1577 // We can't handle this case efficiently. Allocate a sufficiently
1578 // aligned object on the stack, store each operand into it, then load
1579 // the result as a vector.
1580 // Create the stack frame object.
1581 EVT VT = Node->getValueType(0);
1582 EVT MemVT = isa<BuildVectorSDNode>(Node) ? VT.getVectorElementType()
1583 : Node->getOperand(0).getValueType();
1584 SDLoc dl(Node);
1585 SDValue FIPtr = DAG.CreateStackTemporary(VT);
1586 int FI = cast<FrameIndexSDNode>(FIPtr.getNode())->getIndex();
1587 MachinePointerInfo PtrInfo =
1589
1590 // Emit a store of each element to the stack slot.
1592 unsigned TypeByteSize = MemVT.getSizeInBits() / 8;
1593 assert(TypeByteSize > 0 && "Vector element type too small for stack store!");
1594
1595 // If the destination vector element type of a BUILD_VECTOR is narrower than
1596 // the source element type, only store the bits necessary.
1597 bool Truncate = isa<BuildVectorSDNode>(Node) &&
1598 MemVT.bitsLT(Node->getOperand(0).getValueType());
1599
1600 // Store (in the right endianness) the elements to memory.
1601 for (unsigned i = 0, e = Node->getNumOperands(); i != e; ++i) {
1602 // Ignore undef elements.
1603 if (Node->getOperand(i).isUndef()) continue;
1604
1605 unsigned Offset = TypeByteSize*i;
1606
1607 SDValue Idx =
1609
1610 if (Truncate)
1611 Stores.push_back(DAG.getTruncStore(DAG.getEntryNode(), dl,
1612 Node->getOperand(i), Idx,
1613 PtrInfo.getWithOffset(Offset), MemVT));
1614 else
1615 Stores.push_back(DAG.getStore(DAG.getEntryNode(), dl, Node->getOperand(i),
1616 Idx, PtrInfo.getWithOffset(Offset)));
1617 }
1618
1619 SDValue StoreChain;
1620 if (!Stores.empty()) // Not all undef elements?
1621 StoreChain = DAG.getNode(ISD::TokenFactor, dl, MVT::Other, Stores);
1622 else
1623 StoreChain = DAG.getEntryNode();
1624
1625 // Result is a load from the stack slot.
1626 return DAG.getLoad(VT, dl, StoreChain, FIPtr, PtrInfo);
1627}
1628
1629/// Bitcast a floating-point value to an integer value. Only bitcast the part
1630/// containing the sign bit if the target has no integer value capable of
1631/// holding all bits of the floating-point value.
1632void SelectionDAGLegalize::getSignAsIntValue(FloatSignAsInt &State,
1633 const SDLoc &DL,
1634 SDValue Value) const {
1635 EVT FloatVT = Value.getValueType();
1636 unsigned NumBits = FloatVT.getScalarSizeInBits();
1637 State.FloatVT = FloatVT;
1638 EVT IVT = EVT::getIntegerVT(*DAG.getContext(), NumBits);
1639 // Convert to an integer of the same size.
1640 if (TLI.isTypeLegal(IVT)) {
1641 State.IntValue = DAG.getNode(ISD::BITCAST, DL, IVT, Value);
1642 State.SignMask = APInt::getSignMask(NumBits);
1643 State.SignBit = NumBits - 1;
1644 return;
1645 }
1646
1647 auto &DataLayout = DAG.getDataLayout();
1648 // Store the float to memory, then load the sign part out as an integer.
1649 MVT LoadTy = TLI.getRegisterType(MVT::i8);
1650 // First create a temporary that is aligned for both the load and store.
1651 SDValue StackPtr = DAG.CreateStackTemporary(FloatVT, LoadTy);
1652 int FI = cast<FrameIndexSDNode>(StackPtr.getNode())->getIndex();
1653 // Then store the float to it.
1654 State.FloatPtr = StackPtr;
1655 MachineFunction &MF = DAG.getMachineFunction();
1656 State.FloatPointerInfo = MachinePointerInfo::getFixedStack(MF, FI);
1657 State.Chain = DAG.getStore(DAG.getEntryNode(), DL, Value, State.FloatPtr,
1658 State.FloatPointerInfo);
1659
1660 SDValue IntPtr;
1661 if (DataLayout.isBigEndian()) {
1662 assert(FloatVT.isByteSized() && "Unsupported floating point type!");
1663 // Load out a legal integer with the same sign bit as the float.
1664 IntPtr = StackPtr;
1665 State.IntPointerInfo = State.FloatPointerInfo;
1666 } else {
1667 // Advance the pointer so that the loaded byte will contain the sign bit.
1668 unsigned ByteOffset = (NumBits / 8) - 1;
1669 IntPtr =
1670 DAG.getMemBasePlusOffset(StackPtr, TypeSize::getFixed(ByteOffset), DL);
1671 State.IntPointerInfo = MachinePointerInfo::getFixedStack(MF, FI,
1672 ByteOffset);
1673 }
1674
1675 State.IntPtr = IntPtr;
1676 State.IntValue = DAG.getExtLoad(ISD::EXTLOAD, DL, LoadTy, State.Chain, IntPtr,
1677 State.IntPointerInfo, MVT::i8);
1678 State.SignMask = APInt::getOneBitSet(LoadTy.getScalarSizeInBits(), 7);
1679 State.SignBit = 7;
1680}
1681
1682/// Replace the integer value produced by getSignAsIntValue() with a new value
1683/// and cast the result back to a floating-point type.
1684SDValue SelectionDAGLegalize::modifySignAsInt(const FloatSignAsInt &State,
1685 const SDLoc &DL,
1686 SDValue NewIntValue) const {
1687 if (!State.Chain)
1688 return DAG.getNode(ISD::BITCAST, DL, State.FloatVT, NewIntValue);
1689
1690 // Override the part containing the sign bit in the value stored on the stack.
1691 SDValue Chain = DAG.getTruncStore(State.Chain, DL, NewIntValue, State.IntPtr,
1692 State.IntPointerInfo, MVT::i8);
1693 return DAG.getLoad(State.FloatVT, DL, Chain, State.FloatPtr,
1694 State.FloatPointerInfo);
1695}
1696
1697SDValue SelectionDAGLegalize::ExpandFCOPYSIGN(SDNode *Node) const {
1698 SDLoc DL(Node);
1699 SDValue Mag = Node->getOperand(0);
1700 SDValue Sign = Node->getOperand(1);
1701
1702 // Get sign bit into an integer value.
1703 FloatSignAsInt SignAsInt;
1704 getSignAsIntValue(SignAsInt, DL, Sign);
1705
1706 EVT IntVT = SignAsInt.IntValue.getValueType();
1707 SDValue SignMask = DAG.getConstant(SignAsInt.SignMask, DL, IntVT);
1708 SDValue SignBit = DAG.getNode(ISD::AND, DL, IntVT, SignAsInt.IntValue,
1709 SignMask);
1710
1711 // If FABS is legal transform
1712 // FCOPYSIGN(x, y) => SignBit(y) ? -FABS(x) : FABS(x)
1713 EVT FloatVT = Mag.getValueType();
1714 if (TLI.isOperationLegalOrCustom(ISD::FABS, FloatVT) &&
1715 TLI.isOperationLegalOrCustom(ISD::FNEG, FloatVT)) {
1716 SDValue AbsValue = DAG.getNode(ISD::FABS, DL, FloatVT, Mag);
1717 SDValue NegValue = DAG.getNode(ISD::FNEG, DL, FloatVT, AbsValue);
1718 SDValue Cond = DAG.getSetCC(DL, getSetCCResultType(IntVT), SignBit,
1719 DAG.getConstant(0, DL, IntVT), ISD::SETNE);
1720 return DAG.getSelect(DL, FloatVT, Cond, NegValue, AbsValue);
1721 }
1722
1723 // Transform Mag value to integer, and clear the sign bit.
1724 FloatSignAsInt MagAsInt;
1725 getSignAsIntValue(MagAsInt, DL, Mag);
1726 EVT MagVT = MagAsInt.IntValue.getValueType();
1727 SDValue ClearSignMask = DAG.getConstant(~MagAsInt.SignMask, DL, MagVT);
1728 SDValue ClearedSign = DAG.getNode(ISD::AND, DL, MagVT, MagAsInt.IntValue,
1729 ClearSignMask);
1730
1731 // Get the signbit at the right position for MagAsInt.
1732 int ShiftAmount = SignAsInt.SignBit - MagAsInt.SignBit;
1733 EVT ShiftVT = IntVT;
1734 if (SignBit.getScalarValueSizeInBits() <
1735 ClearedSign.getScalarValueSizeInBits()) {
1736 SignBit = DAG.getNode(ISD::ZERO_EXTEND, DL, MagVT, SignBit);
1737 ShiftVT = MagVT;
1738 }
1739 if (ShiftAmount > 0) {
1740 SDValue ShiftCnst = DAG.getConstant(ShiftAmount, DL, ShiftVT);
1741 SignBit = DAG.getNode(ISD::SRL, DL, ShiftVT, SignBit, ShiftCnst);
1742 } else if (ShiftAmount < 0) {
1743 SDValue ShiftCnst = DAG.getConstant(-ShiftAmount, DL, ShiftVT);
1744 SignBit = DAG.getNode(ISD::SHL, DL, ShiftVT, SignBit, ShiftCnst);
1745 }
1746 if (SignBit.getScalarValueSizeInBits() >
1747 ClearedSign.getScalarValueSizeInBits()) {
1748 SignBit = DAG.getNode(ISD::TRUNCATE, DL, MagVT, SignBit);
1749 }
1750
1751 // Store the part with the modified sign and convert back to float.
1752 SDValue CopiedSign = DAG.getNode(ISD::OR, DL, MagVT, ClearedSign, SignBit,
1754
1755 return modifySignAsInt(MagAsInt, DL, CopiedSign);
1756}
1757
1758SDValue SelectionDAGLegalize::ExpandFNEG(SDNode *Node) const {
1759 // Get the sign bit as an integer.
1760 SDLoc DL(Node);
1761 FloatSignAsInt SignAsInt;
1762 getSignAsIntValue(SignAsInt, DL, Node->getOperand(0));
1763 EVT IntVT = SignAsInt.IntValue.getValueType();
1764
1765 // Flip the sign.
1766 SDValue SignMask = DAG.getConstant(SignAsInt.SignMask, DL, IntVT);
1767 SDValue SignFlip =
1768 DAG.getNode(ISD::XOR, DL, IntVT, SignAsInt.IntValue, SignMask);
1769
1770 // Convert back to float.
1771 return modifySignAsInt(SignAsInt, DL, SignFlip);
1772}
1773
1774SDValue SelectionDAGLegalize::ExpandFABS(SDNode *Node) const {
1775 SDLoc DL(Node);
1776 SDValue Value = Node->getOperand(0);
1777
1778 // Transform FABS(x) => FCOPYSIGN(x, 0.0) if FCOPYSIGN is legal.
1779 EVT FloatVT = Value.getValueType();
1780 if (TLI.isOperationLegalOrCustom(ISD::FCOPYSIGN, FloatVT)) {
1781 SDValue Zero = DAG.getConstantFP(0.0, DL, FloatVT);
1782 return DAG.getNode(ISD::FCOPYSIGN, DL, FloatVT, Value, Zero);
1783 }
1784
1785 // Transform value to integer, clear the sign bit and transform back.
1786 FloatSignAsInt ValueAsInt;
1787 getSignAsIntValue(ValueAsInt, DL, Value);
1788 EVT IntVT = ValueAsInt.IntValue.getValueType();
1789 SDValue ClearSignMask = DAG.getConstant(~ValueAsInt.SignMask, DL, IntVT);
1790 SDValue ClearedSign = DAG.getNode(ISD::AND, DL, IntVT, ValueAsInt.IntValue,
1791 ClearSignMask);
1792 return modifySignAsInt(ValueAsInt, DL, ClearedSign);
1793}
1794
1795void SelectionDAGLegalize::ExpandDYNAMIC_STACKALLOC(SDNode* Node,
1796 SmallVectorImpl<SDValue> &Results) {
1798 assert(SPReg && "Target cannot require DYNAMIC_STACKALLOC expansion and"
1799 " not tell us which reg is the stack pointer!");
1800 SDLoc dl(Node);
1801 EVT VT = Node->getValueType(0);
1802 SDValue Tmp1 = SDValue(Node, 0);
1803 SDValue Tmp2 = SDValue(Node, 1);
1804 SDValue Tmp3 = Node->getOperand(2);
1805 SDValue Chain = Tmp1.getOperand(0);
1806
1807 // Chain the dynamic stack allocation so that it doesn't modify the stack
1808 // pointer when other instructions are using the stack.
1809 Chain = DAG.getCALLSEQ_START(Chain, 0, 0, dl);
1810
1811 SDValue Size = Tmp2.getOperand(1);
1812 SDValue SP = DAG.getCopyFromReg(Chain, dl, SPReg, VT);
1813 Chain = SP.getValue(1);
1814 Align Alignment = cast<ConstantSDNode>(Tmp3)->getAlignValue();
1815 const TargetFrameLowering *TFL = DAG.getSubtarget().getFrameLowering();
1816 unsigned Opc =
1819
1820 Align StackAlign = TFL->getStackAlign();
1821 Tmp1 = DAG.getNode(Opc, dl, VT, SP, Size); // Value
1822 if (Alignment > StackAlign)
1823 Tmp1 = DAG.getNode(ISD::AND, dl, VT, Tmp1,
1824 DAG.getSignedConstant(-Alignment.value(), dl, VT));
1825 Chain = DAG.getCopyToReg(Chain, dl, SPReg, Tmp1); // Output chain
1826
1827 Tmp2 = DAG.getCALLSEQ_END(Chain, 0, 0, SDValue(), dl);
1828
1829 Results.push_back(Tmp1);
1830 Results.push_back(Tmp2);
1831}
1832
1833/// Emit a store/load combination to the stack. This stores
1834/// SrcOp to a stack slot of type SlotVT, truncating it if needed. It then does
1835/// a load from the stack slot to DestVT, extending it if needed.
1836/// The resultant code need not be legal.
1837SDValue SelectionDAGLegalize::EmitStackConvert(SDValue SrcOp, EVT SlotVT,
1838 EVT DestVT, const SDLoc &dl) {
1839 return EmitStackConvert(SrcOp, SlotVT, DestVT, dl, DAG.getEntryNode());
1840}
1841
1842SDValue SelectionDAGLegalize::EmitStackConvert(SDValue SrcOp, EVT SlotVT,
1843 EVT DestVT, const SDLoc &dl,
1844 SDValue Chain) {
1845 EVT SrcVT = SrcOp.getValueType();
1846 Type *DestType = DestVT.getTypeForEVT(*DAG.getContext());
1847 Align DestAlign = DAG.getDataLayout().getPrefTypeAlign(DestType);
1848
1849 // Don't convert with stack if the load/store is expensive.
1850 if ((SrcVT.bitsGT(SlotVT) &&
1851 !TLI.isTruncStoreLegalOrCustom(SrcOp.getValueType(), SlotVT)) ||
1852 (SlotVT.bitsLT(DestVT) &&
1853 !TLI.isLoadExtLegalOrCustom(ISD::EXTLOAD, DestVT, SlotVT)))
1854 return SDValue();
1855
1856 // Create the stack frame object.
1857 Align SrcAlign = DAG.getDataLayout().getPrefTypeAlign(
1858 SrcOp.getValueType().getTypeForEVT(*DAG.getContext()));
1859 SDValue FIPtr = DAG.CreateStackTemporary(SlotVT.getStoreSize(), SrcAlign);
1860
1861 FrameIndexSDNode *StackPtrFI = cast<FrameIndexSDNode>(FIPtr);
1862 int SPFI = StackPtrFI->getIndex();
1863 MachinePointerInfo PtrInfo =
1865
1866 // Emit a store to the stack slot. Use a truncstore if the input value is
1867 // later than DestVT.
1868 SDValue Store;
1869
1870 if (SrcVT.bitsGT(SlotVT))
1871 Store = DAG.getTruncStore(Chain, dl, SrcOp, FIPtr, PtrInfo,
1872 SlotVT, SrcAlign);
1873 else {
1874 assert(SrcVT.bitsEq(SlotVT) && "Invalid store");
1875 Store = DAG.getStore(Chain, dl, SrcOp, FIPtr, PtrInfo, SrcAlign);
1876 }
1877
1878 // Result is a load from the stack slot.
1879 if (SlotVT.bitsEq(DestVT))
1880 return DAG.getLoad(DestVT, dl, Store, FIPtr, PtrInfo, DestAlign);
1881
1882 assert(SlotVT.bitsLT(DestVT) && "Unknown extension!");
1883 return DAG.getExtLoad(ISD::EXTLOAD, dl, DestVT, Store, FIPtr, PtrInfo, SlotVT,
1884 DestAlign);
1885}
1886
1887SDValue SelectionDAGLegalize::ExpandSCALAR_TO_VECTOR(SDNode *Node) {
1888 SDLoc dl(Node);
1889 // Create a vector sized/aligned stack slot, store the value to element #0,
1890 // then load the whole vector back out.
1891 SDValue StackPtr = DAG.CreateStackTemporary(Node->getValueType(0));
1892
1893 FrameIndexSDNode *StackPtrFI = cast<FrameIndexSDNode>(StackPtr);
1894 int SPFI = StackPtrFI->getIndex();
1895
1896 SDValue Ch = DAG.getTruncStore(
1897 DAG.getEntryNode(), dl, Node->getOperand(0), StackPtr,
1899 Node->getValueType(0).getVectorElementType());
1900 return DAG.getLoad(
1901 Node->getValueType(0), dl, Ch, StackPtr,
1903}
1904
1905static bool
1907 const TargetLowering &TLI, SDValue &Res) {
1908 unsigned NumElems = Node->getNumOperands();
1909 SDLoc dl(Node);
1910 EVT VT = Node->getValueType(0);
1911
1912 // Try to group the scalars into pairs, shuffle the pairs together, then
1913 // shuffle the pairs of pairs together, etc. until the vector has
1914 // been built. This will work only if all of the necessary shuffle masks
1915 // are legal.
1916
1917 // We do this in two phases; first to check the legality of the shuffles,
1918 // and next, assuming that all shuffles are legal, to create the new nodes.
1919 for (int Phase = 0; Phase < 2; ++Phase) {
1921 NewIntermedVals;
1922 for (unsigned i = 0; i < NumElems; ++i) {
1923 SDValue V = Node->getOperand(i);
1924 if (V.isUndef())
1925 continue;
1926
1927 SDValue Vec;
1928 if (Phase)
1929 Vec = DAG.getNode(ISD::SCALAR_TO_VECTOR, dl, VT, V);
1930 IntermedVals.push_back(std::make_pair(Vec, SmallVector<int, 16>(1, i)));
1931 }
1932
1933 while (IntermedVals.size() > 2) {
1934 NewIntermedVals.clear();
1935 for (unsigned i = 0, e = (IntermedVals.size() & ~1u); i < e; i += 2) {
1936 // This vector and the next vector are shuffled together (simply to
1937 // append the one to the other).
1938 SmallVector<int, 16> ShuffleVec(NumElems, -1);
1939
1940 SmallVector<int, 16> FinalIndices;
1941 FinalIndices.reserve(IntermedVals[i].second.size() +
1942 IntermedVals[i+1].second.size());
1943
1944 int k = 0;
1945 for (unsigned j = 0, f = IntermedVals[i].second.size(); j != f;
1946 ++j, ++k) {
1947 ShuffleVec[k] = j;
1948 FinalIndices.push_back(IntermedVals[i].second[j]);
1949 }
1950 for (unsigned j = 0, f = IntermedVals[i+1].second.size(); j != f;
1951 ++j, ++k) {
1952 ShuffleVec[k] = NumElems + j;
1953 FinalIndices.push_back(IntermedVals[i+1].second[j]);
1954 }
1955
1956 SDValue Shuffle;
1957 if (Phase)
1958 Shuffle = DAG.getVectorShuffle(VT, dl, IntermedVals[i].first,
1959 IntermedVals[i+1].first,
1960 ShuffleVec);
1961 else if (!TLI.isShuffleMaskLegal(ShuffleVec, VT))
1962 return false;
1963 NewIntermedVals.push_back(
1964 std::make_pair(Shuffle, std::move(FinalIndices)));
1965 }
1966
1967 // If we had an odd number of defined values, then append the last
1968 // element to the array of new vectors.
1969 if ((IntermedVals.size() & 1) != 0)
1970 NewIntermedVals.push_back(IntermedVals.back());
1971
1972 IntermedVals.swap(NewIntermedVals);
1973 }
1974
1975 assert(IntermedVals.size() <= 2 && IntermedVals.size() > 0 &&
1976 "Invalid number of intermediate vectors");
1977 SDValue Vec1 = IntermedVals[0].first;
1978 SDValue Vec2;
1979 if (IntermedVals.size() > 1)
1980 Vec2 = IntermedVals[1].first;
1981 else if (Phase)
1982 Vec2 = DAG.getUNDEF(VT);
1983
1984 SmallVector<int, 16> ShuffleVec(NumElems, -1);
1985 for (unsigned i = 0, e = IntermedVals[0].second.size(); i != e; ++i)
1986 ShuffleVec[IntermedVals[0].second[i]] = i;
1987 for (unsigned i = 0, e = IntermedVals[1].second.size(); i != e; ++i)
1988 ShuffleVec[IntermedVals[1].second[i]] = NumElems + i;
1989
1990 if (Phase)
1991 Res = DAG.getVectorShuffle(VT, dl, Vec1, Vec2, ShuffleVec);
1992 else if (!TLI.isShuffleMaskLegal(ShuffleVec, VT))
1993 return false;
1994 }
1995
1996 return true;
1997}
1998
1999/// Expand a BUILD_VECTOR node on targets that don't
2000/// support the operation, but do support the resultant vector type.
2001SDValue SelectionDAGLegalize::ExpandBUILD_VECTOR(SDNode *Node) {
2002 unsigned NumElems = Node->getNumOperands();
2003 SDValue Value1, Value2;
2004 SDLoc dl(Node);
2005 EVT VT = Node->getValueType(0);
2006 EVT OpVT = Node->getOperand(0).getValueType();
2007 EVT EltVT = VT.getVectorElementType();
2008
2009 // If the only non-undef value is the low element, turn this into a
2010 // SCALAR_TO_VECTOR node. If this is { X, X, X, X }, determine X.
2011 bool isOnlyLowElement = true;
2012 bool MoreThanTwoValues = false;
2013 bool isConstant = true;
2014 for (unsigned i = 0; i < NumElems; ++i) {
2015 SDValue V = Node->getOperand(i);
2016 if (V.isUndef())
2017 continue;
2018 if (i > 0)
2019 isOnlyLowElement = false;
2021 isConstant = false;
2022
2023 if (!Value1.getNode()) {
2024 Value1 = V;
2025 } else if (!Value2.getNode()) {
2026 if (V != Value1)
2027 Value2 = V;
2028 } else if (V != Value1 && V != Value2) {
2029 MoreThanTwoValues = true;
2030 }
2031 }
2032
2033 if (!Value1.getNode())
2034 return DAG.getUNDEF(VT);
2035
2036 if (isOnlyLowElement)
2037 return DAG.getNode(ISD::SCALAR_TO_VECTOR, dl, VT, Node->getOperand(0));
2038
2039 // If all elements are constants, create a load from the constant pool.
2040 if (isConstant) {
2042 for (unsigned i = 0, e = NumElems; i != e; ++i) {
2043 if (ConstantFPSDNode *V =
2044 dyn_cast<ConstantFPSDNode>(Node->getOperand(i))) {
2045 CV.push_back(const_cast<ConstantFP *>(V->getConstantFPValue()));
2046 } else if (ConstantSDNode *V =
2047 dyn_cast<ConstantSDNode>(Node->getOperand(i))) {
2048 if (OpVT==EltVT)
2049 CV.push_back(const_cast<ConstantInt *>(V->getConstantIntValue()));
2050 else {
2051 // If OpVT and EltVT don't match, EltVT is not legal and the
2052 // element values have been promoted/truncated earlier. Undo this;
2053 // we don't want a v16i8 to become a v16i32 for example.
2054 const ConstantInt *CI = V->getConstantIntValue();
2055 CV.push_back(ConstantInt::get(EltVT.getTypeForEVT(*DAG.getContext()),
2056 CI->getZExtValue(), /*IsSigned=*/false,
2057 /*ImplicitTrunc=*/true));
2058 }
2059 } else {
2060 assert(Node->getOperand(i).isUndef());
2061 Type *OpNTy = EltVT.getTypeForEVT(*DAG.getContext());
2062 CV.push_back(UndefValue::get(OpNTy));
2063 }
2064 }
2066 SDValue CPIdx =
2067 DAG.getConstantPool(CP, TLI.getPointerTy(DAG.getDataLayout()));
2068 Align Alignment = cast<ConstantPoolSDNode>(CPIdx)->getAlign();
2069 return DAG.getLoad(
2070 VT, dl, DAG.getEntryNode(), CPIdx,
2072 Alignment);
2073 }
2074
2075 SmallSet<SDValue, 16> DefinedValues;
2076 for (unsigned i = 0; i < NumElems; ++i) {
2077 if (Node->getOperand(i).isUndef())
2078 continue;
2079 DefinedValues.insert(Node->getOperand(i));
2080 }
2081
2082 if (TLI.shouldExpandBuildVectorWithShuffles(VT, DefinedValues.size())) {
2083 if (!MoreThanTwoValues) {
2084 SmallVector<int, 8> ShuffleVec(NumElems, -1);
2085 for (unsigned i = 0; i < NumElems; ++i) {
2086 SDValue V = Node->getOperand(i);
2087 if (V.isUndef())
2088 continue;
2089 ShuffleVec[i] = V == Value1 ? 0 : NumElems;
2090 }
2091 if (TLI.isShuffleMaskLegal(ShuffleVec, Node->getValueType(0))) {
2092 // Get the splatted value into the low element of a vector register.
2093 SDValue Vec1 = DAG.getNode(ISD::SCALAR_TO_VECTOR, dl, VT, Value1);
2094 SDValue Vec2;
2095 if (Value2.getNode())
2096 Vec2 = DAG.getNode(ISD::SCALAR_TO_VECTOR, dl, VT, Value2);
2097 else
2098 Vec2 = DAG.getUNDEF(VT);
2099
2100 // Return shuffle(LowValVec, undef, <0,0,0,0>)
2101 return DAG.getVectorShuffle(VT, dl, Vec1, Vec2, ShuffleVec);
2102 }
2103 } else {
2104 SDValue Res;
2105 if (ExpandBVWithShuffles(Node, DAG, TLI, Res))
2106 return Res;
2107 }
2108 }
2109
2110 // Otherwise, we can't handle this case efficiently.
2111 return ExpandVectorBuildThroughStack(Node);
2112}
2113
2114SDValue SelectionDAGLegalize::ExpandSPLAT_VECTOR(SDNode *Node) {
2115 SDLoc DL(Node);
2116 EVT VT = Node->getValueType(0);
2117 SDValue SplatVal = Node->getOperand(0);
2118
2119 return DAG.getSplatBuildVector(VT, DL, SplatVal);
2120}
2121
2122// Expand a node into a call to a libcall, returning the value as the first
2123// result and the chain as the second. If the result value does not fit into a
2124// register, return the lo part and set the hi part to the by-reg argument in
2125// the first. If it does fit into a single register, return the result and
2126// leave the Hi part unset.
2127std::pair<SDValue, SDValue>
2128SelectionDAGLegalize::ExpandLibCall(RTLIB::Libcall LC, SDNode *Node,
2129 TargetLowering::ArgListTy &&Args,
2130 bool IsSigned, EVT RetVT) {
2131 EVT CodePtrTy = TLI.getPointerTy(DAG.getDataLayout());
2133 RTLIB::LibcallImpl LCImpl = TLI.getLibcallImpl(LC);
2134 if (LCImpl != RTLIB::Unsupported)
2135 Callee = DAG.getExternalSymbol(LCImpl, CodePtrTy);
2136 else {
2137 Callee = DAG.getPOISON(CodePtrTy);
2138 DAG.getContext()->emitError(Twine("no libcall available for ") +
2139 Node->getOperationName(&DAG));
2140 }
2141
2142 Type *RetTy = RetVT.getTypeForEVT(*DAG.getContext());
2143
2144 // By default, the input chain to this libcall is the entry node of the
2145 // function. If the libcall is going to be emitted as a tail call then
2146 // TLI.isUsedByReturnOnly will change it to the right chain if the return
2147 // node which is being folded has a non-entry input chain.
2148 SDValue InChain = DAG.getEntryNode();
2149
2150 // isTailCall may be true since the callee does not reference caller stack
2151 // frame. Check if it's in the right position and that the return types match.
2152 SDValue TCChain = InChain;
2153 const Function &F = DAG.getMachineFunction().getFunction();
2154 bool isTailCall =
2155 TLI.isInTailCallPosition(DAG, Node, TCChain) &&
2156 (RetTy == F.getReturnType() || F.getReturnType()->isVoidTy());
2157 if (isTailCall)
2158 InChain = TCChain;
2159
2160 TargetLowering::CallLoweringInfo CLI(DAG);
2161 bool signExtend = TLI.shouldSignExtendTypeInLibCall(RetTy, IsSigned);
2162 CLI.setDebugLoc(SDLoc(Node))
2163 .setChain(InChain)
2164 .setLibCallee(TLI.getLibcallImplCallingConv(LCImpl), RetTy, Callee,
2165 std::move(Args))
2166 .setTailCall(isTailCall)
2167 .setSExtResult(signExtend)
2168 .setZExtResult(!signExtend)
2169 .setIsPostTypeLegalization(true);
2170
2171 std::pair<SDValue, SDValue> CallInfo = TLI.LowerCallTo(CLI);
2172
2173 if (!CallInfo.second.getNode()) {
2174 LLVM_DEBUG(dbgs() << "Created tailcall: "; DAG.getRoot().dump(&DAG));
2175 // It's a tailcall, return the chain (which is the DAG root).
2176 return {DAG.getRoot(), DAG.getRoot()};
2177 }
2178
2179 LLVM_DEBUG(dbgs() << "Created libcall: "; CallInfo.first.dump(&DAG));
2180 return CallInfo;
2181}
2182
2183std::pair<SDValue, SDValue> SelectionDAGLegalize::ExpandLibCall(RTLIB::Libcall LC, SDNode *Node,
2184 bool isSigned) {
2185 TargetLowering::ArgListTy Args;
2186 for (const SDValue &Op : Node->op_values()) {
2187 EVT ArgVT = Op.getValueType();
2188 Type *ArgTy = ArgVT.getTypeForEVT(*DAG.getContext());
2189 TargetLowering::ArgListEntry Entry(Op, ArgTy);
2190 Entry.IsSExt = TLI.shouldSignExtendTypeInLibCall(ArgTy, isSigned);
2191 Entry.IsZExt = !Entry.IsSExt;
2192 Args.push_back(Entry);
2193 }
2194
2195 return ExpandLibCall(LC, Node, std::move(Args), isSigned,
2196 Node->getValueType(0));
2197}
2198
2199void SelectionDAGLegalize::ExpandFPLibCall(SDNode* Node,
2200 RTLIB::Libcall LC,
2201 SmallVectorImpl<SDValue> &Results) {
2202 if (LC == RTLIB::UNKNOWN_LIBCALL)
2203 llvm_unreachable("Can't create an unknown libcall!");
2204
2205 if (Node->isStrictFPOpcode()) {
2206 EVT RetVT = Node->getValueType(0);
2208 TargetLowering::MakeLibCallOptions CallOptions;
2209 CallOptions.IsPostTypeLegalization = true;
2210 // FIXME: This doesn't support tail calls.
2211 std::pair<SDValue, SDValue> Tmp = TLI.makeLibCall(DAG, LC, RetVT,
2212 Ops, CallOptions,
2213 SDLoc(Node),
2214 Node->getOperand(0));
2215 Results.push_back(Tmp.first);
2216 Results.push_back(Tmp.second);
2217 } else {
2218 bool IsSignedArgument = Node->getOpcode() == ISD::FLDEXP;
2219 SDValue Tmp = ExpandLibCall(LC, Node, IsSignedArgument).first;
2220 Results.push_back(Tmp);
2221 }
2222}
2223
2224/// Expand the node to a libcall based on the result type.
2225void SelectionDAGLegalize::ExpandFPLibCall(SDNode* Node,
2226 RTLIB::Libcall Call_F32,
2227 RTLIB::Libcall Call_F64,
2228 RTLIB::Libcall Call_F80,
2229 RTLIB::Libcall Call_F128,
2230 RTLIB::Libcall Call_PPCF128,
2231 SmallVectorImpl<SDValue> &Results) {
2232 RTLIB::Libcall LC = RTLIB::getFPLibCall(Node->getSimpleValueType(0),
2233 Call_F32, Call_F64, Call_F80,
2234 Call_F128, Call_PPCF128);
2235 ExpandFPLibCall(Node, LC, Results);
2236}
2237
2238void SelectionDAGLegalize::ExpandFastFPLibCall(
2239 SDNode *Node, bool IsFast,
2240 std::pair<RTLIB::Libcall, RTLIB::Libcall> Call_F32,
2241 std::pair<RTLIB::Libcall, RTLIB::Libcall> Call_F64,
2242 std::pair<RTLIB::Libcall, RTLIB::Libcall> Call_F80,
2243 std::pair<RTLIB::Libcall, RTLIB::Libcall> Call_F128,
2244 std::pair<RTLIB::Libcall, RTLIB::Libcall> Call_PPCF128,
2245 SmallVectorImpl<SDValue> &Results) {
2246
2247 EVT VT = Node->getSimpleValueType(0);
2248
2249 RTLIB::Libcall LC;
2250
2251 // FIXME: Probably should define fast to respect nan/inf and only be
2252 // approximate functions.
2253
2254 if (IsFast) {
2255 LC = RTLIB::getFPLibCall(VT, Call_F32.first, Call_F64.first, Call_F80.first,
2256 Call_F128.first, Call_PPCF128.first);
2257 }
2258
2259 if (!IsFast || TLI.getLibcallImpl(LC) == RTLIB::Unsupported) {
2260 // Fall back if we don't have a fast implementation.
2261 LC = RTLIB::getFPLibCall(VT, Call_F32.second, Call_F64.second,
2262 Call_F80.second, Call_F128.second,
2263 Call_PPCF128.second);
2264 }
2265
2266 ExpandFPLibCall(Node, LC, Results);
2267}
2268
2269SDValue SelectionDAGLegalize::ExpandIntLibCall(SDNode* Node, bool isSigned,
2270 RTLIB::Libcall Call_I8,
2271 RTLIB::Libcall Call_I16,
2272 RTLIB::Libcall Call_I32,
2273 RTLIB::Libcall Call_I64,
2274 RTLIB::Libcall Call_I128) {
2275 RTLIB::Libcall LC;
2276 switch (Node->getSimpleValueType(0).SimpleTy) {
2277 default: llvm_unreachable("Unexpected request for libcall!");
2278 case MVT::i8: LC = Call_I8; break;
2279 case MVT::i16: LC = Call_I16; break;
2280 case MVT::i32: LC = Call_I32; break;
2281 case MVT::i64: LC = Call_I64; break;
2282 case MVT::i128: LC = Call_I128; break;
2283 }
2284 return ExpandLibCall(LC, Node, isSigned).first;
2285}
2286
2287/// Expand the node to a libcall based on first argument type (for instance
2288/// lround and its variant).
2289void SelectionDAGLegalize::ExpandArgFPLibCall(SDNode* Node,
2290 RTLIB::Libcall Call_F32,
2291 RTLIB::Libcall Call_F64,
2292 RTLIB::Libcall Call_F80,
2293 RTLIB::Libcall Call_F128,
2294 RTLIB::Libcall Call_PPCF128,
2295 SmallVectorImpl<SDValue> &Results) {
2296 EVT InVT = Node->getOperand(Node->isStrictFPOpcode() ? 1 : 0).getValueType();
2297 RTLIB::Libcall LC = RTLIB::getFPLibCall(InVT.getSimpleVT(),
2298 Call_F32, Call_F64, Call_F80,
2299 Call_F128, Call_PPCF128);
2300 ExpandFPLibCall(Node, LC, Results);
2301}
2302
2303SDValue SelectionDAGLegalize::ExpandBitCountingLibCall(
2304 SDNode *Node, RTLIB::Libcall CallI32, RTLIB::Libcall CallI64,
2305 RTLIB::Libcall CallI128) {
2306 RTLIB::Libcall LC;
2307 switch (Node->getSimpleValueType(0).SimpleTy) {
2308 default:
2309 llvm_unreachable("Unexpected request for libcall!");
2310 case MVT::i32:
2311 LC = CallI32;
2312 break;
2313 case MVT::i64:
2314 LC = CallI64;
2315 break;
2316 case MVT::i128:
2317 LC = CallI128;
2318 break;
2319 }
2320
2321 // Bit-counting libcalls have one unsigned argument and return `int`.
2322 // Note that `int` may be illegal on this target; ExpandLibCall will
2323 // take care of promoting it to a legal type.
2324 SDValue Op = Node->getOperand(0);
2325 EVT IntVT =
2327
2328 EVT ArgVT = Op.getValueType();
2329 Type *ArgTy = ArgVT.getTypeForEVT(*DAG.getContext());
2330 TargetLowering::ArgListEntry Arg(Op, ArgTy);
2331 Arg.IsSExt = TLI.shouldSignExtendTypeInLibCall(ArgTy, /*IsSigned=*/false);
2332 Arg.IsZExt = !Arg.IsSExt;
2333
2334 SDValue Res = ExpandLibCall(LC, Node, TargetLowering::ArgListTy{Arg},
2335 /*IsSigned=*/true, IntVT)
2336 .first;
2337
2338 // If ExpandLibCall created a tail call, the result was already
2339 // of the correct type. Otherwise, we need to sign extend it.
2340 if (Res.getValueType() != MVT::Other)
2341 Res = DAG.getSExtOrTrunc(Res, SDLoc(Node), Node->getValueType(0));
2342 return Res;
2343}
2344
2345/// Issue libcalls to __{u}divmod to compute div / rem pairs.
2346void
2347SelectionDAGLegalize::ExpandDivRemLibCall(SDNode *Node,
2348 SmallVectorImpl<SDValue> &Results) {
2349 unsigned Opcode = Node->getOpcode();
2350 bool isSigned = Opcode == ISD::SDIVREM;
2351
2352 RTLIB::Libcall LC;
2353 switch (Node->getSimpleValueType(0).SimpleTy) {
2354 default: llvm_unreachable("Unexpected request for libcall!");
2355 case MVT::i8: LC= isSigned ? RTLIB::SDIVREM_I8 : RTLIB::UDIVREM_I8; break;
2356 case MVT::i16: LC= isSigned ? RTLIB::SDIVREM_I16 : RTLIB::UDIVREM_I16; break;
2357 case MVT::i32: LC= isSigned ? RTLIB::SDIVREM_I32 : RTLIB::UDIVREM_I32; break;
2358 case MVT::i64: LC= isSigned ? RTLIB::SDIVREM_I64 : RTLIB::UDIVREM_I64; break;
2359 case MVT::i128: LC= isSigned ? RTLIB::SDIVREM_I128:RTLIB::UDIVREM_I128; break;
2360 }
2361
2362 // The input chain to this libcall is the entry node of the function.
2363 // Legalizing the call will automatically add the previous call to the
2364 // dependence.
2365 SDValue InChain = DAG.getEntryNode();
2366
2367 EVT RetVT = Node->getValueType(0);
2368 Type *RetTy = RetVT.getTypeForEVT(*DAG.getContext());
2369
2370 TargetLowering::ArgListTy Args;
2371 for (const SDValue &Op : Node->op_values()) {
2372 EVT ArgVT = Op.getValueType();
2373 Type *ArgTy = ArgVT.getTypeForEVT(*DAG.getContext());
2374 TargetLowering::ArgListEntry Entry(Op, ArgTy);
2375 Entry.IsSExt = isSigned;
2376 Entry.IsZExt = !isSigned;
2377 Args.push_back(Entry);
2378 }
2379
2380 // Also pass the return address of the remainder.
2381 SDValue FIPtr = DAG.CreateStackTemporary(RetVT);
2382 TargetLowering::ArgListEntry Entry(
2383 FIPtr, PointerType::getUnqual(RetTy->getContext()));
2384 Entry.IsSExt = isSigned;
2385 Entry.IsZExt = !isSigned;
2386 Args.push_back(Entry);
2387
2388 RTLIB::LibcallImpl LibcallImpl = TLI.getLibcallImpl(LC);
2389 if (LibcallImpl == RTLIB::Unsupported) {
2390 DAG.getContext()->emitError(Twine("no libcall available for ") +
2391 Node->getOperationName(&DAG));
2392 SDValue Poison = DAG.getPOISON(RetVT);
2393 Results.push_back(Poison);
2394 Results.push_back(Poison);
2395 return;
2396 }
2397
2398 SDValue Callee =
2399 DAG.getExternalSymbol(LibcallImpl, TLI.getPointerTy(DAG.getDataLayout()));
2400
2401 SDLoc dl(Node);
2402 TargetLowering::CallLoweringInfo CLI(DAG);
2403 CLI.setDebugLoc(dl)
2404 .setChain(InChain)
2405 .setLibCallee(TLI.getLibcallImplCallingConv(LibcallImpl), RetTy, Callee,
2406 std::move(Args))
2407 .setSExtResult(isSigned)
2408 .setZExtResult(!isSigned);
2409
2410 std::pair<SDValue, SDValue> CallInfo = TLI.LowerCallTo(CLI);
2411
2412 // Remainder is loaded back from the stack frame.
2413 int FI = cast<FrameIndexSDNode>(FIPtr)->getIndex();
2414 MachinePointerInfo PtrInfo =
2416
2417 SDValue Rem = DAG.getLoad(RetVT, dl, CallInfo.second, FIPtr, PtrInfo);
2418 Results.push_back(CallInfo.first);
2419 Results.push_back(Rem);
2420}
2421
2422/// Return true if sincos or __sincos_stret libcall is available.
2424 MVT::SimpleValueType VT = Node->getSimpleValueType(0).SimpleTy;
2425 return TLI.getLibcallImpl(RTLIB::getSINCOS(VT)) != RTLIB::Unsupported ||
2426 TLI.getLibcallImpl(RTLIB::getSINCOS_STRET(VT)) != RTLIB::Unsupported;
2427}
2428
2429/// Only issue sincos libcall if both sin and cos are needed.
2430static bool useSinCos(SDNode *Node) {
2431 unsigned OtherOpcode = Node->getOpcode() == ISD::FSIN
2432 ? ISD::FCOS : ISD::FSIN;
2433
2434 SDValue Op0 = Node->getOperand(0);
2435 for (const SDNode *User : Op0.getNode()->users()) {
2436 if (User == Node)
2437 continue;
2438 // The other user might have been turned into sincos already.
2439 if (User->getOpcode() == OtherOpcode || User->getOpcode() == ISD::FSINCOS)
2440 return true;
2441 }
2442 return false;
2443}
2444
2445SDValue SelectionDAGLegalize::ExpandSincosStretLibCall(SDNode *Node) const {
2446 // For iOS, we want to call an alternative entry point: __sincos_stret,
2447 // which returns the values in two S / D registers.
2448 SDLoc dl(Node);
2449 SDValue Arg = Node->getOperand(0);
2450 EVT ArgVT = Arg.getValueType();
2451 RTLIB::Libcall LC = RTLIB::getSINCOS_STRET(ArgVT);
2452 RTLIB::LibcallImpl SincosStret = TLI.getLibcallImpl(LC);
2453 if (SincosStret == RTLIB::Unsupported)
2454 return SDValue();
2455
2456 /// There are 3 different ABI cases to handle:
2457 /// - Direct return of separate fields in registers
2458 /// - Single return as vector elements
2459 /// - sret struct
2460
2461 const RTLIB::RuntimeLibcallsInfo &CallsInfo = TLI.getRuntimeLibcallsInfo();
2462
2463 const DataLayout &DL = DAG.getDataLayout();
2464
2465 auto [FuncTy, FuncAttrs] = CallsInfo.getFunctionTy(
2466 *DAG.getContext(), TM.getTargetTriple(), DL, SincosStret);
2467
2468 Type *SincosStretRetTy = FuncTy->getReturnType();
2469 CallingConv::ID CallConv = CallsInfo.getLibcallImplCallingConv(SincosStret);
2470
2471 SDValue Callee =
2472 DAG.getExternalSymbol(SincosStret, TLI.getProgramPointerTy(DL));
2473
2474 TargetLowering::ArgListTy Args;
2475 SDValue SRet;
2476
2477 int FrameIdx;
2478 if (FuncTy->getParamType(0)->isPointerTy()) {
2479 // Uses sret
2480 MachineFrameInfo &MFI = DAG.getMachineFunction().getFrameInfo();
2481
2482 AttributeSet PtrAttrs = FuncAttrs.getParamAttrs(0);
2483 Type *StructTy = PtrAttrs.getStructRetType();
2484 const uint64_t ByteSize = DL.getTypeAllocSize(StructTy);
2485 const Align StackAlign = DL.getPrefTypeAlign(StructTy);
2486
2487 FrameIdx = MFI.CreateStackObject(ByteSize, StackAlign, false);
2488 SRet = DAG.getFrameIndex(FrameIdx, TLI.getFrameIndexTy(DL));
2489
2490 TargetLowering::ArgListEntry Entry(SRet, FuncTy->getParamType(0));
2491 Entry.IsSRet = true;
2492 Entry.IndirectType = StructTy;
2493 Entry.Alignment = StackAlign;
2494
2495 Args.push_back(Entry);
2496 Args.emplace_back(Arg, FuncTy->getParamType(1));
2497 } else {
2498 Args.emplace_back(Arg, FuncTy->getParamType(0));
2499 }
2500
2501 TargetLowering::CallLoweringInfo CLI(DAG);
2502 CLI.setDebugLoc(dl)
2503 .setChain(DAG.getEntryNode())
2504 .setLibCallee(CallConv, SincosStretRetTy, Callee, std::move(Args))
2505 .setIsPostTypeLegalization();
2506
2507 std::pair<SDValue, SDValue> CallResult = TLI.LowerCallTo(CLI);
2508
2509 if (SRet) {
2510 MachinePointerInfo PtrInfo =
2512 SDValue LoadSin = DAG.getLoad(ArgVT, dl, CallResult.second, SRet, PtrInfo);
2513
2514 TypeSize StoreSize = ArgVT.getStoreSize();
2515
2516 // Address of cos field.
2517 SDValue Add = DAG.getObjectPtrOffset(dl, SRet, StoreSize);
2518 SDValue LoadCos = DAG.getLoad(ArgVT, dl, LoadSin.getValue(1), Add,
2519 PtrInfo.getWithOffset(StoreSize));
2520
2521 SDVTList Tys = DAG.getVTList(ArgVT, ArgVT);
2522 return DAG.getNode(ISD::MERGE_VALUES, dl, Tys, LoadSin.getValue(0),
2523 LoadCos.getValue(0));
2524 }
2525
2526 if (!CallResult.first.getValueType().isVector())
2527 return CallResult.first;
2528
2529 SDValue SinVal =
2530 DAG.getNode(ISD::EXTRACT_VECTOR_ELT, dl, ArgVT, CallResult.first,
2531 DAG.getVectorIdxConstant(0, dl));
2532 SDValue CosVal =
2533 DAG.getNode(ISD::EXTRACT_VECTOR_ELT, dl, ArgVT, CallResult.first,
2534 DAG.getVectorIdxConstant(1, dl));
2535 SDVTList Tys = DAG.getVTList(ArgVT, ArgVT);
2536 return DAG.getNode(ISD::MERGE_VALUES, dl, Tys, SinVal, CosVal);
2537}
2538
2539SDValue SelectionDAGLegalize::expandLdexp(SDNode *Node) const {
2540 SDLoc dl(Node);
2541 EVT VT = Node->getValueType(0);
2542 SDValue X = Node->getOperand(0);
2543 SDValue N = Node->getOperand(1);
2544 EVT ExpVT = N.getValueType();
2545 EVT AsIntVT = VT.changeTypeToInteger();
2546 if (AsIntVT == EVT()) // TODO: How to handle f80?
2547 return SDValue();
2548
2549 if (Node->getOpcode() == ISD::STRICT_FLDEXP) // TODO
2550 return SDValue();
2551
2552 SDNodeFlags NSW;
2553 NSW.setNoSignedWrap(true);
2554 SDNodeFlags NUW_NSW;
2555 NUW_NSW.setNoUnsignedWrap(true);
2556 NUW_NSW.setNoSignedWrap(true);
2557
2558 EVT SetCCVT =
2559 TLI.getSetCCResultType(DAG.getDataLayout(), *DAG.getContext(), ExpVT);
2560 const fltSemantics &FltSem = VT.getFltSemantics();
2561
2562 const APFloat::ExponentType MaxExpVal = APFloat::semanticsMaxExponent(FltSem);
2563 const APFloat::ExponentType MinExpVal = APFloat::semanticsMinExponent(FltSem);
2564 const int Precision = APFloat::semanticsPrecision(FltSem);
2565
2566 const SDValue MaxExp = DAG.getSignedConstant(MaxExpVal, dl, ExpVT);
2567 const SDValue MinExp = DAG.getSignedConstant(MinExpVal, dl, ExpVT);
2568
2569 const SDValue DoubleMaxExp = DAG.getSignedConstant(2 * MaxExpVal, dl, ExpVT);
2570
2571 const APFloat One(FltSem, "1.0");
2572 APFloat ScaleUpK = scalbn(One, MaxExpVal, APFloat::rmNearestTiesToEven);
2573
2574 // Offset by precision to avoid denormal range.
2575 APFloat ScaleDownK =
2576 scalbn(One, MinExpVal + Precision, APFloat::rmNearestTiesToEven);
2577
2578 // TODO: Should really introduce control flow and use a block for the >
2579 // MaxExp, < MinExp cases
2580
2581 // First, handle exponents Exp > MaxExp and scale down.
2582 SDValue NGtMaxExp = DAG.getSetCC(dl, SetCCVT, N, MaxExp, ISD::SETGT);
2583
2584 SDValue DecN0 = DAG.getNode(ISD::SUB, dl, ExpVT, N, MaxExp, NSW);
2585 SDValue ClampMaxVal = DAG.getConstant(3 * MaxExpVal, dl, ExpVT);
2586 SDValue ClampN_Big = DAG.getNode(ISD::SMIN, dl, ExpVT, N, ClampMaxVal);
2587 SDValue DecN1 =
2588 DAG.getNode(ISD::SUB, dl, ExpVT, ClampN_Big, DoubleMaxExp, NSW);
2589
2590 SDValue ScaleUpTwice =
2591 DAG.getSetCC(dl, SetCCVT, N, DoubleMaxExp, ISD::SETUGT);
2592
2593 const SDValue ScaleUpVal = DAG.getConstantFP(ScaleUpK, dl, VT);
2594 SDValue ScaleUp0 = DAG.getNode(ISD::FMUL, dl, VT, X, ScaleUpVal);
2595 SDValue ScaleUp1 = DAG.getNode(ISD::FMUL, dl, VT, ScaleUp0, ScaleUpVal);
2596
2597 SDValue SelectN_Big =
2598 DAG.getNode(ISD::SELECT, dl, ExpVT, ScaleUpTwice, DecN1, DecN0);
2599 SDValue SelectX_Big =
2600 DAG.getNode(ISD::SELECT, dl, VT, ScaleUpTwice, ScaleUp1, ScaleUp0);
2601
2602 // Now handle exponents Exp < MinExp
2603 SDValue NLtMinExp = DAG.getSetCC(dl, SetCCVT, N, MinExp, ISD::SETLT);
2604
2605 SDValue Increment0 = DAG.getConstant(-(MinExpVal + Precision), dl, ExpVT);
2606 SDValue Increment1 = DAG.getConstant(-2 * (MinExpVal + Precision), dl, ExpVT);
2607
2608 SDValue IncN0 = DAG.getNode(ISD::ADD, dl, ExpVT, N, Increment0, NUW_NSW);
2609
2610 SDValue ClampMinVal =
2611 DAG.getSignedConstant(3 * MinExpVal + 2 * Precision, dl, ExpVT);
2612 SDValue ClampN_Small = DAG.getNode(ISD::SMAX, dl, ExpVT, N, ClampMinVal);
2613 SDValue IncN1 =
2614 DAG.getNode(ISD::ADD, dl, ExpVT, ClampN_Small, Increment1, NSW);
2615
2616 const SDValue ScaleDownVal = DAG.getConstantFP(ScaleDownK, dl, VT);
2617 SDValue ScaleDown0 = DAG.getNode(ISD::FMUL, dl, VT, X, ScaleDownVal);
2618 SDValue ScaleDown1 = DAG.getNode(ISD::FMUL, dl, VT, ScaleDown0, ScaleDownVal);
2619
2620 SDValue ScaleDownTwice = DAG.getSetCC(
2621 dl, SetCCVT, N,
2622 DAG.getSignedConstant(2 * MinExpVal + Precision, dl, ExpVT), ISD::SETULT);
2623
2624 SDValue SelectN_Small =
2625 DAG.getNode(ISD::SELECT, dl, ExpVT, ScaleDownTwice, IncN1, IncN0);
2626 SDValue SelectX_Small =
2627 DAG.getNode(ISD::SELECT, dl, VT, ScaleDownTwice, ScaleDown1, ScaleDown0);
2628
2629 // Now combine the two out of range exponent handling cases with the base
2630 // case.
2631 SDValue NewX = DAG.getNode(
2632 ISD::SELECT, dl, VT, NGtMaxExp, SelectX_Big,
2633 DAG.getNode(ISD::SELECT, dl, VT, NLtMinExp, SelectX_Small, X));
2634
2635 SDValue NewN = DAG.getNode(
2636 ISD::SELECT, dl, ExpVT, NGtMaxExp, SelectN_Big,
2637 DAG.getNode(ISD::SELECT, dl, ExpVT, NLtMinExp, SelectN_Small, N));
2638
2639 SDValue BiasedN = DAG.getNode(ISD::ADD, dl, ExpVT, NewN, MaxExp, NSW);
2640
2641 SDValue ExponentShiftAmt =
2642 DAG.getShiftAmountConstant(Precision - 1, ExpVT, dl);
2643 SDValue CastExpToValTy = DAG.getZExtOrTrunc(BiasedN, dl, AsIntVT);
2644
2645 SDValue AsInt = DAG.getNode(ISD::SHL, dl, AsIntVT, CastExpToValTy,
2646 ExponentShiftAmt, NUW_NSW);
2647 SDValue AsFP = DAG.getNode(ISD::BITCAST, dl, VT, AsInt);
2648 return DAG.getNode(ISD::FMUL, dl, VT, NewX, AsFP);
2649}
2650
2651SDValue SelectionDAGLegalize::expandFrexp(SDNode *Node) const {
2652 SDLoc dl(Node);
2653 SDValue Val = Node->getOperand(0);
2654 EVT VT = Val.getValueType();
2655 EVT ExpVT = Node->getValueType(1);
2656 EVT AsIntVT = VT.changeTypeToInteger();
2657 if (AsIntVT == EVT()) // TODO: How to handle f80?
2658 return SDValue();
2659
2660 const fltSemantics &FltSem = VT.getFltSemantics();
2661 const APFloat::ExponentType MinExpVal = APFloat::semanticsMinExponent(FltSem);
2662 const unsigned Precision = APFloat::semanticsPrecision(FltSem);
2663 const unsigned BitSize = VT.getScalarSizeInBits();
2664
2665 // TODO: Could introduce control flow and skip over the denormal handling.
2666
2667 // scale_up = fmul value, scalbn(1.0, precision + 1)
2668 // extracted_exp = (bitcast value to uint) >> precision - 1
2669 // biased_exp = extracted_exp + min_exp
2670 // extracted_fract = (bitcast value to uint) & (fract_mask | sign_mask)
2671 //
2672 // is_denormal = val < smallest_normalized
2673 // computed_fract = is_denormal ? scale_up : extracted_fract
2674 // computed_exp = is_denormal ? biased_exp + (-precision - 1) : biased_exp
2675 //
2676 // result_0 = (!isfinite(val) || iszero(val)) ? val : computed_fract
2677 // result_1 = (!isfinite(val) || iszero(val)) ? 0 : computed_exp
2678
2679 SDValue NegSmallestNormalizedInt = DAG.getConstant(
2680 APFloat::getSmallestNormalized(FltSem, true).bitcastToAPInt(), dl,
2681 AsIntVT);
2682
2683 SDValue SmallestNormalizedInt = DAG.getConstant(
2684 APFloat::getSmallestNormalized(FltSem, false).bitcastToAPInt(), dl,
2685 AsIntVT);
2686
2687 // Masks out the exponent bits.
2688 SDValue ExpMask =
2689 DAG.getConstant(APFloat::getInf(FltSem).bitcastToAPInt(), dl, AsIntVT);
2690
2691 // Mask out the exponent part of the value.
2692 //
2693 // e.g, for f32 FractSignMaskVal = 0x807fffff
2694 APInt FractSignMaskVal = APInt::getBitsSet(BitSize, 0, Precision - 1);
2695 FractSignMaskVal.setBit(BitSize - 1); // Set the sign bit
2696
2697 APInt SignMaskVal = APInt::getSignedMaxValue(BitSize);
2698 SDValue SignMask = DAG.getConstant(SignMaskVal, dl, AsIntVT);
2699
2700 SDValue FractSignMask = DAG.getConstant(FractSignMaskVal, dl, AsIntVT);
2701
2702 const APFloat One(FltSem, "1.0");
2703 // Scale a possible denormal input.
2704 // e.g., for f64, 0x1p+54
2705 APFloat ScaleUpKVal =
2706 scalbn(One, Precision + 1, APFloat::rmNearestTiesToEven);
2707
2708 SDValue ScaleUpK = DAG.getConstantFP(ScaleUpKVal, dl, VT);
2709 SDValue ScaleUp = DAG.getNode(ISD::FMUL, dl, VT, Val, ScaleUpK);
2710
2711 EVT SetCCVT =
2712 TLI.getSetCCResultType(DAG.getDataLayout(), *DAG.getContext(), VT);
2713
2714 SDValue AsInt = DAG.getNode(ISD::BITCAST, dl, AsIntVT, Val);
2715
2716 SDValue Abs = DAG.getNode(ISD::AND, dl, AsIntVT, AsInt, SignMask);
2717
2718 SDValue AddNegSmallestNormal =
2719 DAG.getNode(ISD::ADD, dl, AsIntVT, Abs, NegSmallestNormalizedInt);
2720 SDValue DenormOrZero = DAG.getSetCC(dl, SetCCVT, AddNegSmallestNormal,
2721 NegSmallestNormalizedInt, ISD::SETULE);
2722
2723 SDValue IsDenormal =
2724 DAG.getSetCC(dl, SetCCVT, Abs, SmallestNormalizedInt, ISD::SETULT);
2725
2726 SDValue MinExp = DAG.getSignedConstant(MinExpVal, dl, ExpVT);
2727 SDValue Zero = DAG.getConstant(0, dl, ExpVT);
2728
2729 SDValue ScaledAsInt = DAG.getNode(ISD::BITCAST, dl, AsIntVT, ScaleUp);
2730 SDValue ScaledSelect =
2731 DAG.getNode(ISD::SELECT, dl, AsIntVT, IsDenormal, ScaledAsInt, AsInt);
2732
2733 SDValue ExpMaskScaled =
2734 DAG.getNode(ISD::AND, dl, AsIntVT, ScaledAsInt, ExpMask);
2735
2736 SDValue ScaledValue =
2737 DAG.getNode(ISD::SELECT, dl, AsIntVT, IsDenormal, ExpMaskScaled, Abs);
2738
2739 // Extract the exponent bits.
2740 SDValue ExponentShiftAmt =
2741 DAG.getShiftAmountConstant(Precision - 1, AsIntVT, dl);
2742 SDValue ShiftedExp =
2743 DAG.getNode(ISD::SRL, dl, AsIntVT, ScaledValue, ExponentShiftAmt);
2744 SDValue Exp = DAG.getSExtOrTrunc(ShiftedExp, dl, ExpVT);
2745
2746 SDValue NormalBiasedExp = DAG.getNode(ISD::ADD, dl, ExpVT, Exp, MinExp);
2747 SDValue DenormalOffset = DAG.getConstant(-Precision - 1, dl, ExpVT);
2748 SDValue DenormalExpBias =
2749 DAG.getNode(ISD::SELECT, dl, ExpVT, IsDenormal, DenormalOffset, Zero);
2750
2751 SDValue MaskedFractAsInt =
2752 DAG.getNode(ISD::AND, dl, AsIntVT, ScaledSelect, FractSignMask);
2753 const APFloat Half(FltSem, "0.5");
2754 SDValue FPHalf = DAG.getConstant(Half.bitcastToAPInt(), dl, AsIntVT);
2755 SDValue Or = DAG.getNode(ISD::OR, dl, AsIntVT, MaskedFractAsInt, FPHalf);
2756 SDValue MaskedFract = DAG.getNode(ISD::BITCAST, dl, VT, Or);
2757
2758 SDValue ComputedExp =
2759 DAG.getNode(ISD::ADD, dl, ExpVT, NormalBiasedExp, DenormalExpBias);
2760
2761 SDValue Result0 =
2762 DAG.getNode(ISD::SELECT, dl, VT, DenormOrZero, Val, MaskedFract);
2763
2764 SDValue Result1 =
2765 DAG.getNode(ISD::SELECT, dl, ExpVT, DenormOrZero, Zero, ComputedExp);
2766
2767 return DAG.getMergeValues({Result0, Result1}, dl);
2768}
2769
2770/// This function is responsible for legalizing a
2771/// INT_TO_FP operation of the specified operand when the target requests that
2772/// we expand it. At this point, we know that the result and operand types are
2773/// legal for the target.
2774SDValue SelectionDAGLegalize::ExpandLegalINT_TO_FP(SDNode *Node,
2775 SDValue &Chain) {
2776 bool isSigned = (Node->getOpcode() == ISD::STRICT_SINT_TO_FP ||
2777 Node->getOpcode() == ISD::SINT_TO_FP);
2778 EVT DestVT = Node->getValueType(0);
2779 SDLoc dl(Node);
2780 unsigned OpNo = Node->isStrictFPOpcode() ? 1 : 0;
2781 SDValue Op0 = Node->getOperand(OpNo);
2782 EVT SrcVT = Op0.getValueType();
2783
2784 // TODO: Should any fast-math-flags be set for the created nodes?
2785 LLVM_DEBUG(dbgs() << "Legalizing INT_TO_FP\n");
2786 if (SrcVT == MVT::i32 && TLI.isTypeLegal(MVT::f64) &&
2787 (DestVT.bitsLE(MVT::f64) ||
2788 TLI.isOperationLegal(Node->isStrictFPOpcode() ? ISD::STRICT_FP_EXTEND
2790 DestVT))) {
2791 LLVM_DEBUG(dbgs() << "32-bit [signed|unsigned] integer to float/double "
2792 "expansion\n");
2793
2794 // Get the stack frame index of a 8 byte buffer.
2795 SDValue StackSlot = DAG.CreateStackTemporary(MVT::f64);
2796
2797 SDValue Lo = Op0;
2798 // if signed map to unsigned space
2799 if (isSigned) {
2800 // Invert sign bit (signed to unsigned mapping).
2801 Lo = DAG.getNode(ISD::XOR, dl, MVT::i32, Lo,
2802 DAG.getConstant(0x80000000u, dl, MVT::i32));
2803 }
2804 // Initial hi portion of constructed double.
2805 SDValue Hi = DAG.getConstant(0x43300000u, dl, MVT::i32);
2806
2807 // If this a big endian target, swap the lo and high data.
2808 if (DAG.getDataLayout().isBigEndian())
2809 std::swap(Lo, Hi);
2810
2811 SDValue MemChain = DAG.getEntryNode();
2812
2813 // Store the lo of the constructed double.
2814 SDValue Store1 = DAG.getStore(MemChain, dl, Lo, StackSlot,
2815 MachinePointerInfo());
2816 // Store the hi of the constructed double.
2817 SDValue HiPtr =
2818 DAG.getMemBasePlusOffset(StackSlot, TypeSize::getFixed(4), dl);
2819 SDValue Store2 =
2820 DAG.getStore(MemChain, dl, Hi, HiPtr, MachinePointerInfo());
2821 MemChain = DAG.getNode(ISD::TokenFactor, dl, MVT::Other, Store1, Store2);
2822
2823 // load the constructed double
2824 SDValue Load =
2825 DAG.getLoad(MVT::f64, dl, MemChain, StackSlot, MachinePointerInfo());
2826 // FP constant to bias correct the final result
2827 SDValue Bias = DAG.getConstantFP(
2828 isSigned ? llvm::bit_cast<double>(0x4330000080000000ULL)
2829 : llvm::bit_cast<double>(0x4330000000000000ULL),
2830 dl, MVT::f64);
2831 // Subtract the bias and get the final result.
2832 SDValue Sub;
2834 if (Node->isStrictFPOpcode()) {
2835 Sub = DAG.getNode(ISD::STRICT_FSUB, dl, {MVT::f64, MVT::Other},
2836 {Node->getOperand(0), Load, Bias});
2837 Chain = Sub.getValue(1);
2838 if (DestVT != Sub.getValueType()) {
2839 std::pair<SDValue, SDValue> ResultPair;
2840 ResultPair =
2841 DAG.getStrictFPExtendOrRound(Sub, Chain, dl, DestVT);
2842 Result = ResultPair.first;
2843 Chain = ResultPair.second;
2844 }
2845 else
2846 Result = Sub;
2847 } else {
2848 Sub = DAG.getNode(ISD::FSUB, dl, MVT::f64, Load, Bias);
2849 Result = DAG.getFPExtendOrRound(Sub, dl, DestVT);
2850 }
2851 return Result;
2852 }
2853
2854 if (isSigned)
2855 return SDValue();
2856
2857 // TODO: Generalize this for use with other types.
2858 if (((SrcVT == MVT::i32 || SrcVT == MVT::i64) && DestVT == MVT::f32) ||
2859 (SrcVT == MVT::i64 && DestVT == MVT::f64)) {
2860 LLVM_DEBUG(dbgs() << "Converting unsigned i32/i64 to f32/f64\n");
2861 // For unsigned conversions, convert them to signed conversions using the
2862 // algorithm from the x86_64 __floatundisf in compiler_rt. That method
2863 // should be valid for i32->f32 as well.
2864
2865 // More generally this transform should be valid if there are 3 more bits
2866 // in the integer type than the significand. Rounding uses the first bit
2867 // after the width of the significand and the OR of all bits after that. So
2868 // we need to be able to OR the shifted out bit into one of the bits that
2869 // participate in the OR.
2870
2871 // TODO: This really should be implemented using a branch rather than a
2872 // select. We happen to get lucky and machinesink does the right
2873 // thing most of the time. This would be a good candidate for a
2874 // pseudo-op, or, even better, for whole-function isel.
2875 EVT SetCCVT = getSetCCResultType(SrcVT);
2876
2877 SDValue SignBitTest = DAG.getSetCC(
2878 dl, SetCCVT, Op0, DAG.getConstant(0, dl, SrcVT), ISD::SETLT);
2879
2880 SDValue ShiftConst = DAG.getShiftAmountConstant(1, SrcVT, dl);
2881 SDValue Shr = DAG.getNode(ISD::SRL, dl, SrcVT, Op0, ShiftConst);
2882 SDValue AndConst = DAG.getConstant(1, dl, SrcVT);
2883 SDValue And = DAG.getNode(ISD::AND, dl, SrcVT, Op0, AndConst);
2884 SDValue Or = DAG.getNode(ISD::OR, dl, SrcVT, And, Shr);
2885
2886 SDValue Slow, Fast;
2887 if (Node->isStrictFPOpcode()) {
2888 // In strict mode, we must avoid spurious exceptions, and therefore
2889 // must make sure to only emit a single STRICT_SINT_TO_FP.
2890 SDValue InCvt = DAG.getSelect(dl, SrcVT, SignBitTest, Or, Op0);
2891 // The STRICT_SINT_TO_FP inherits the exception mode from the
2892 // incoming STRICT_UINT_TO_FP node; the STRICT_FADD node can
2893 // never raise any exception.
2894 SDNodeFlags Flags;
2895 Flags.setNoFPExcept(Node->getFlags().hasNoFPExcept());
2896 Fast = DAG.getNode(ISD::STRICT_SINT_TO_FP, dl, {DestVT, MVT::Other},
2897 {Node->getOperand(0), InCvt}, Flags);
2898 Flags.setNoFPExcept(true);
2899 Slow = DAG.getNode(ISD::STRICT_FADD, dl, {DestVT, MVT::Other},
2900 {Fast.getValue(1), Fast, Fast}, Flags);
2901 Chain = Slow.getValue(1);
2902 } else {
2903 SDValue SignCvt = DAG.getNode(ISD::SINT_TO_FP, dl, DestVT, Or);
2904 Slow = DAG.getNode(ISD::FADD, dl, DestVT, SignCvt, SignCvt);
2905 Fast = DAG.getNode(ISD::SINT_TO_FP, dl, DestVT, Op0);
2906 }
2907
2908 return DAG.getSelect(dl, DestVT, SignBitTest, Slow, Fast);
2909 }
2910
2911 // Don't expand it if there isn't cheap fadd.
2912 if (!TLI.isOperationLegalOrCustom(
2913 Node->isStrictFPOpcode() ? ISD::STRICT_FADD : ISD::FADD, DestVT))
2914 return SDValue();
2915
2916 // The following optimization is valid only if every value in SrcVT (when
2917 // treated as signed) is representable in DestVT. Check that the mantissa
2918 // size of DestVT is >= than the number of bits in SrcVT -1.
2919 assert(APFloat::semanticsPrecision(DestVT.getFltSemantics()) >=
2920 SrcVT.getSizeInBits() - 1 &&
2921 "Cannot perform lossless SINT_TO_FP!");
2922
2923 SDValue Tmp1;
2924 if (Node->isStrictFPOpcode()) {
2925 Tmp1 = DAG.getNode(ISD::STRICT_SINT_TO_FP, dl, { DestVT, MVT::Other },
2926 { Node->getOperand(0), Op0 });
2927 } else
2928 Tmp1 = DAG.getNode(ISD::SINT_TO_FP, dl, DestVT, Op0);
2929
2930 SDValue SignSet = DAG.getSetCC(dl, getSetCCResultType(SrcVT), Op0,
2931 DAG.getConstant(0, dl, SrcVT), ISD::SETLT);
2932 SDValue Zero = DAG.getIntPtrConstant(0, dl),
2933 Four = DAG.getIntPtrConstant(4, dl);
2934 SDValue CstOffset = DAG.getSelect(dl, Zero.getValueType(),
2935 SignSet, Four, Zero);
2936
2937 // If the sign bit of the integer is set, the large number will be treated
2938 // as a negative number. To counteract this, the dynamic code adds an
2939 // offset depending on the data type.
2940 uint64_t FF;
2941 switch (SrcVT.getSimpleVT().SimpleTy) {
2942 default:
2943 return SDValue();
2944 case MVT::i8 : FF = 0x43800000ULL; break; // 2^8 (as a float)
2945 case MVT::i16: FF = 0x47800000ULL; break; // 2^16 (as a float)
2946 case MVT::i32: FF = 0x4F800000ULL; break; // 2^32 (as a float)
2947 case MVT::i64: FF = 0x5F800000ULL; break; // 2^64 (as a float)
2948 }
2949 if (DAG.getDataLayout().isLittleEndian())
2950 FF <<= 32;
2951 Constant *FudgeFactor = ConstantInt::get(
2952 Type::getInt64Ty(*DAG.getContext()), FF);
2953
2954 SDValue CPIdx =
2955 DAG.getConstantPool(FudgeFactor, TLI.getPointerTy(DAG.getDataLayout()));
2956 Align Alignment = cast<ConstantPoolSDNode>(CPIdx)->getAlign();
2957 CPIdx = DAG.getNode(ISD::ADD, dl, CPIdx.getValueType(), CPIdx, CstOffset);
2958 Alignment = commonAlignment(Alignment, 4);
2959 SDValue FudgeInReg;
2960 if (DestVT == MVT::f32)
2961 FudgeInReg = DAG.getLoad(
2962 MVT::f32, dl, DAG.getEntryNode(), CPIdx,
2964 Alignment);
2965 else {
2966 SDValue Load = DAG.getExtLoad(
2967 ISD::EXTLOAD, dl, DestVT, DAG.getEntryNode(), CPIdx,
2969 Alignment);
2970 HandleSDNode Handle(Load);
2971 LegalizeOp(Load.getNode());
2972 FudgeInReg = Handle.getValue();
2973 }
2974
2975 if (Node->isStrictFPOpcode()) {
2976 SDValue Result = DAG.getNode(ISD::STRICT_FADD, dl, { DestVT, MVT::Other },
2977 { Tmp1.getValue(1), Tmp1, FudgeInReg });
2978 Chain = Result.getValue(1);
2979 return Result;
2980 }
2981
2982 return DAG.getNode(ISD::FADD, dl, DestVT, Tmp1, FudgeInReg);
2983}
2984
2985/// This function is responsible for legalizing a
2986/// *INT_TO_FP operation of the specified operand when the target requests that
2987/// we promote it. At this point, we know that the result and operand types are
2988/// legal for the target, and that there is a legal UINT_TO_FP or SINT_TO_FP
2989/// operation that takes a larger input.
2990void SelectionDAGLegalize::PromoteLegalINT_TO_FP(
2991 SDNode *N, const SDLoc &dl, SmallVectorImpl<SDValue> &Results) {
2992 bool IsStrict = N->isStrictFPOpcode();
2993 bool IsSigned = N->getOpcode() == ISD::SINT_TO_FP ||
2994 N->getOpcode() == ISD::STRICT_SINT_TO_FP;
2995 EVT DestVT = N->getValueType(0);
2996 SDValue LegalOp = N->getOperand(IsStrict ? 1 : 0);
2997 unsigned UIntOp = IsStrict ? ISD::STRICT_UINT_TO_FP : ISD::UINT_TO_FP;
2998 unsigned SIntOp = IsStrict ? ISD::STRICT_SINT_TO_FP : ISD::SINT_TO_FP;
2999
3000 // First step, figure out the appropriate *INT_TO_FP operation to use.
3001 EVT NewInTy = LegalOp.getValueType();
3002
3003 unsigned OpToUse = 0;
3004
3005 // Scan for the appropriate larger type to use.
3006 while (true) {
3007 NewInTy = (MVT::SimpleValueType)(NewInTy.getSimpleVT().SimpleTy+1);
3008 assert(NewInTy.isInteger() && "Ran out of possibilities!");
3009
3010 // If the target supports SINT_TO_FP of this type, use it.
3011 if (TLI.isOperationLegalOrCustom(SIntOp, NewInTy)) {
3012 OpToUse = SIntOp;
3013 break;
3014 }
3015 if (IsSigned)
3016 continue;
3017
3018 // If the target supports UINT_TO_FP of this type, use it.
3019 if (TLI.isOperationLegalOrCustom(UIntOp, NewInTy)) {
3020 OpToUse = UIntOp;
3021 break;
3022 }
3023
3024 // Otherwise, try a larger type.
3025 }
3026
3027 // Okay, we found the operation and type to use. Zero extend our input to the
3028 // desired type then run the operation on it.
3029 if (IsStrict) {
3030 SDValue Res =
3031 DAG.getNode(OpToUse, dl, {DestVT, MVT::Other},
3032 {N->getOperand(0),
3033 DAG.getNode(IsSigned ? ISD::SIGN_EXTEND : ISD::ZERO_EXTEND,
3034 dl, NewInTy, LegalOp)});
3035 Results.push_back(Res);
3036 Results.push_back(Res.getValue(1));
3037 return;
3038 }
3039
3040 Results.push_back(
3041 DAG.getNode(OpToUse, dl, DestVT,
3042 DAG.getNode(IsSigned ? ISD::SIGN_EXTEND : ISD::ZERO_EXTEND,
3043 dl, NewInTy, LegalOp)));
3044}
3045
3046/// This function is responsible for legalizing a
3047/// FP_TO_*INT operation of the specified operand when the target requests that
3048/// we promote it. At this point, we know that the result and operand types are
3049/// legal for the target, and that there is a legal FP_TO_UINT or FP_TO_SINT
3050/// operation that returns a larger result.
3051void SelectionDAGLegalize::PromoteLegalFP_TO_INT(SDNode *N, const SDLoc &dl,
3052 SmallVectorImpl<SDValue> &Results) {
3053 bool IsStrict = N->isStrictFPOpcode();
3054 bool IsSigned = N->getOpcode() == ISD::FP_TO_SINT ||
3055 N->getOpcode() == ISD::STRICT_FP_TO_SINT;
3056 EVT DestVT = N->getValueType(0);
3057 SDValue LegalOp = N->getOperand(IsStrict ? 1 : 0);
3058 // First step, figure out the appropriate FP_TO*INT operation to use.
3059 EVT NewOutTy = DestVT;
3060
3061 unsigned OpToUse = 0;
3062
3063 // Scan for the appropriate larger type to use.
3064 while (true) {
3065 NewOutTy = (MVT::SimpleValueType)(NewOutTy.getSimpleVT().SimpleTy+1);
3066 assert(NewOutTy.isInteger() && "Ran out of possibilities!");
3067
3068 // A larger signed type can hold all unsigned values of the requested type,
3069 // so using FP_TO_SINT is valid
3070 OpToUse = IsStrict ? ISD::STRICT_FP_TO_SINT : ISD::FP_TO_SINT;
3071 if (TLI.isOperationLegalOrCustom(OpToUse, NewOutTy))
3072 break;
3073
3074 // However, if the value may be < 0.0, we *must* use some FP_TO_SINT.
3075 OpToUse = IsStrict ? ISD::STRICT_FP_TO_UINT : ISD::FP_TO_UINT;
3076 if (!IsSigned && TLI.isOperationLegalOrCustom(OpToUse, NewOutTy))
3077 break;
3078
3079 // Otherwise, try a larger type.
3080 }
3081
3082 // Okay, we found the operation and type to use.
3084 if (IsStrict) {
3085 SDVTList VTs = DAG.getVTList(NewOutTy, MVT::Other);
3086 Operation = DAG.getNode(OpToUse, dl, VTs, N->getOperand(0), LegalOp);
3087 } else
3088 Operation = DAG.getNode(OpToUse, dl, NewOutTy, LegalOp);
3089
3090 // Truncate the result of the extended FP_TO_*INT operation to the desired
3091 // size.
3092 SDValue Trunc = DAG.getNode(ISD::TRUNCATE, dl, DestVT, Operation);
3093 Results.push_back(Trunc);
3094 if (IsStrict)
3095 Results.push_back(Operation.getValue(1));
3096}
3097
3098/// Promote FP_TO_*INT_SAT operation to a larger result type. At this point
3099/// the result and operand types are legal and there must be a legal
3100/// FP_TO_*INT_SAT operation for a larger result type.
3101SDValue SelectionDAGLegalize::PromoteLegalFP_TO_INT_SAT(SDNode *Node,
3102 const SDLoc &dl) {
3103 unsigned Opcode = Node->getOpcode();
3104
3105 // Scan for the appropriate larger type to use.
3106 EVT NewOutTy = Node->getValueType(0);
3107 while (true) {
3108 NewOutTy = (MVT::SimpleValueType)(NewOutTy.getSimpleVT().SimpleTy + 1);
3109 assert(NewOutTy.isInteger() && "Ran out of possibilities!");
3110
3111 if (TLI.isOperationLegalOrCustom(Opcode, NewOutTy))
3112 break;
3113 }
3114
3115 // Saturation width is determined by second operand, so we don't have to
3116 // perform any fixup and can directly truncate the result.
3117 SDValue Result = DAG.getNode(Opcode, dl, NewOutTy, Node->getOperand(0),
3118 Node->getOperand(1));
3119 return DAG.getNode(ISD::TRUNCATE, dl, Node->getValueType(0), Result);
3120}
3121
3122/// Open code the operations for PARITY of the specified operation.
3123SDValue SelectionDAGLegalize::ExpandPARITY(SDValue Op, const SDLoc &dl) {
3124 EVT VT = Op.getValueType();
3125 EVT ShVT = TLI.getShiftAmountTy(VT, DAG.getDataLayout());
3126 unsigned Sz = VT.getScalarSizeInBits();
3127
3128 // If CTPOP is legal, use it. Otherwise use shifts and xor.
3131 Result = DAG.getNode(ISD::CTPOP, dl, VT, Op);
3132 } else {
3133 Result = Op;
3134 for (unsigned i = Log2_32_Ceil(Sz); i != 0;) {
3135 SDValue Shift = DAG.getNode(ISD::SRL, dl, VT, Result,
3136 DAG.getConstant(1ULL << (--i), dl, ShVT));
3137 Result = DAG.getNode(ISD::XOR, dl, VT, Result, Shift);
3138 }
3139 }
3140
3141 return DAG.getNode(ISD::AND, dl, VT, Result, DAG.getConstant(1, dl, VT));
3142}
3143
3144SDValue SelectionDAGLegalize::PromoteReduction(SDNode *Node) {
3145 bool IsVPOpcode = ISD::isVPOpcode(Node->getOpcode());
3146 MVT VecVT = IsVPOpcode ? Node->getOperand(1).getSimpleValueType()
3147 : Node->getOperand(0).getSimpleValueType();
3148 MVT NewVecVT = TLI.getTypeToPromoteTo(Node->getOpcode(), VecVT);
3149 MVT ScalarVT = Node->getSimpleValueType(0);
3150 MVT NewScalarVT = NewVecVT.getVectorElementType();
3151
3152 SDLoc DL(Node);
3153 SmallVector<SDValue, 4> Operands(Node->getNumOperands());
3154
3155 // FIXME: Support integer.
3156 assert(Node->getOperand(0).getValueType().isFloatingPoint() &&
3157 "Only FP promotion is supported");
3158
3159 for (unsigned j = 0; j != Node->getNumOperands(); ++j)
3160 if (Node->getOperand(j).getValueType().isVector() &&
3161 !(IsVPOpcode &&
3162 ISD::getVPMaskIdx(Node->getOpcode()) == j)) { // Skip mask operand.
3163 // promote the vector operand.
3164 // FIXME: Support integer.
3165 assert(Node->getOperand(j).getValueType().isFloatingPoint() &&
3166 "Only FP promotion is supported");
3167 Operands[j] =
3168 DAG.getNode(ISD::FP_EXTEND, DL, NewVecVT, Node->getOperand(j));
3169 } else if (Node->getOperand(j).getValueType().isFloatingPoint()) {
3170 // promote the initial value.
3171 Operands[j] =
3172 DAG.getNode(ISD::FP_EXTEND, DL, NewScalarVT, Node->getOperand(j));
3173 } else {
3174 Operands[j] = Node->getOperand(j); // Skip VL operand.
3175 }
3176
3177 SDValue Res = DAG.getNode(Node->getOpcode(), DL, NewScalarVT, Operands,
3178 Node->getFlags());
3179
3180 assert(ScalarVT.isFloatingPoint() && "Only FP promotion is supported");
3181 return DAG.getNode(ISD::FP_ROUND, DL, ScalarVT, Res,
3182 DAG.getIntPtrConstant(0, DL, /*isTarget=*/true));
3183}
3184
3185bool SelectionDAGLegalize::ExpandNode(SDNode *Node) {
3186 LLVM_DEBUG(dbgs() << "Trying to expand node\n");
3188 SDLoc dl(Node);
3189 SDValue Tmp1, Tmp2, Tmp3, Tmp4;
3190 bool NeedInvert;
3191 switch (Node->getOpcode()) {
3192 case ISD::ABS:
3193 if ((Tmp1 = TLI.expandABS(Node, DAG)))
3194 Results.push_back(Tmp1);
3195 break;
3196 case ISD::ABDS:
3197 case ISD::ABDU:
3198 if ((Tmp1 = TLI.expandABD(Node, DAG)))
3199 Results.push_back(Tmp1);
3200 break;
3201 case ISD::AVGCEILS:
3202 case ISD::AVGCEILU:
3203 case ISD::AVGFLOORS:
3204 case ISD::AVGFLOORU:
3205 if ((Tmp1 = TLI.expandAVG(Node, DAG)))
3206 Results.push_back(Tmp1);
3207 break;
3208 case ISD::CTPOP:
3209 if ((Tmp1 = TLI.expandCTPOP(Node, DAG)))
3210 Results.push_back(Tmp1);
3211 break;
3212 case ISD::CTLZ:
3214 if ((Tmp1 = TLI.expandCTLZ(Node, DAG)))
3215 Results.push_back(Tmp1);
3216 break;
3217 case ISD::CTTZ:
3219 if ((Tmp1 = TLI.expandCTTZ(Node, DAG)))
3220 Results.push_back(Tmp1);
3221 break;
3222 case ISD::BITREVERSE:
3223 if ((Tmp1 = TLI.expandBITREVERSE(Node, DAG)))
3224 Results.push_back(Tmp1);
3225 break;
3226 case ISD::BSWAP:
3227 if ((Tmp1 = TLI.expandBSWAP(Node, DAG)))
3228 Results.push_back(Tmp1);
3229 break;
3230 case ISD::PARITY:
3231 Results.push_back(ExpandPARITY(Node->getOperand(0), dl));
3232 break;
3233 case ISD::FRAMEADDR:
3234 case ISD::RETURNADDR:
3236 Results.push_back(DAG.getConstant(0, dl, Node->getValueType(0)));
3237 break;
3238 case ISD::EH_DWARF_CFA: {
3239 SDValue CfaArg = DAG.getSExtOrTrunc(Node->getOperand(0), dl,
3240 TLI.getPointerTy(DAG.getDataLayout()));
3241 SDValue Offset = DAG.getNode(ISD::ADD, dl,
3242 CfaArg.getValueType(),
3244 CfaArg.getValueType()),
3245 CfaArg);
3246 SDValue FA = DAG.getNode(
3248 DAG.getConstant(0, dl, TLI.getPointerTy(DAG.getDataLayout())));
3249 Results.push_back(DAG.getNode(ISD::ADD, dl, FA.getValueType(),
3250 FA, Offset));
3251 break;
3252 }
3253 case ISD::GET_ROUNDING:
3254 Results.push_back(DAG.getConstant(1, dl, Node->getValueType(0)));
3255 Results.push_back(Node->getOperand(0));
3256 break;
3257 case ISD::EH_RETURN:
3258 case ISD::EH_LABEL:
3259 case ISD::PREFETCH:
3260 case ISD::VAEND:
3262 // If the target didn't expand these, there's nothing to do, so just
3263 // preserve the chain and be done.
3264 Results.push_back(Node->getOperand(0));
3265 break;
3268 // If the target didn't expand this, just return 'zero' and preserve the
3269 // chain.
3270 Results.append(Node->getNumValues() - 1,
3271 DAG.getConstant(0, dl, Node->getValueType(0)));
3272 Results.push_back(Node->getOperand(0));
3273 break;
3275 // If the target didn't expand this, just return 'zero' and preserve the
3276 // chain.
3277 Results.push_back(DAG.getConstant(0, dl, MVT::i32));
3278 Results.push_back(Node->getOperand(0));
3279 break;
3280 case ISD::ATOMIC_LOAD: {
3281 // There is no libcall for atomic load; fake it with ATOMIC_CMP_SWAP.
3282 SDValue Zero = DAG.getConstant(0, dl, Node->getValueType(0));
3283 SDVTList VTs = DAG.getVTList(Node->getValueType(0), MVT::Other);
3284 SDValue Swap = DAG.getAtomicCmpSwap(
3285 ISD::ATOMIC_CMP_SWAP, dl, cast<AtomicSDNode>(Node)->getMemoryVT(), VTs,
3286 Node->getOperand(0), Node->getOperand(1), Zero, Zero,
3287 cast<AtomicSDNode>(Node)->getMemOperand());
3288 Results.push_back(Swap.getValue(0));
3289 Results.push_back(Swap.getValue(1));
3290 break;
3291 }
3292 case ISD::ATOMIC_STORE: {
3293 // There is no libcall for atomic store; fake it with ATOMIC_SWAP.
3294 SDValue Swap = DAG.getAtomic(
3295 ISD::ATOMIC_SWAP, dl, cast<AtomicSDNode>(Node)->getMemoryVT(),
3296 Node->getOperand(0), Node->getOperand(2), Node->getOperand(1),
3297 cast<AtomicSDNode>(Node)->getMemOperand());
3298 Results.push_back(Swap.getValue(1));
3299 break;
3300 }
3302 // Expanding an ATOMIC_CMP_SWAP_WITH_SUCCESS produces an ATOMIC_CMP_SWAP and
3303 // splits out the success value as a comparison. Expanding the resulting
3304 // ATOMIC_CMP_SWAP will produce a libcall.
3305 SDVTList VTs = DAG.getVTList(Node->getValueType(0), MVT::Other);
3306 SDValue Res = DAG.getAtomicCmpSwap(
3307 ISD::ATOMIC_CMP_SWAP, dl, cast<AtomicSDNode>(Node)->getMemoryVT(), VTs,
3308 Node->getOperand(0), Node->getOperand(1), Node->getOperand(2),
3309 Node->getOperand(3), cast<MemSDNode>(Node)->getMemOperand());
3310
3311 SDValue ExtRes = Res;
3312 SDValue LHS = Res;
3313 SDValue RHS = Node->getOperand(1);
3314
3315 EVT AtomicType = cast<AtomicSDNode>(Node)->getMemoryVT();
3316 EVT OuterType = Node->getValueType(0);
3317 switch (TLI.getExtendForAtomicOps()) {
3318 case ISD::SIGN_EXTEND:
3319 LHS = DAG.getNode(ISD::AssertSext, dl, OuterType, Res,
3320 DAG.getValueType(AtomicType));
3321 RHS = DAG.getNode(ISD::SIGN_EXTEND_INREG, dl, OuterType,
3322 Node->getOperand(2), DAG.getValueType(AtomicType));
3323 ExtRes = LHS;
3324 break;
3325 case ISD::ZERO_EXTEND:
3326 LHS = DAG.getNode(ISD::AssertZext, dl, OuterType, Res,
3327 DAG.getValueType(AtomicType));
3328 RHS = DAG.getZeroExtendInReg(Node->getOperand(2), dl, AtomicType);
3329 ExtRes = LHS;
3330 break;
3331 case ISD::ANY_EXTEND:
3332 LHS = DAG.getZeroExtendInReg(Res, dl, AtomicType);
3333 RHS = DAG.getZeroExtendInReg(Node->getOperand(2), dl, AtomicType);
3334 break;
3335 default:
3336 llvm_unreachable("Invalid atomic op extension");
3337 }
3338
3340 DAG.getSetCC(dl, Node->getValueType(1), LHS, RHS, ISD::SETEQ);
3341
3342 Results.push_back(ExtRes.getValue(0));
3343 Results.push_back(Success);
3344 Results.push_back(Res.getValue(1));
3345 break;
3346 }
3347 case ISD::ATOMIC_LOAD_SUB: {
3348 SDLoc DL(Node);
3349 EVT VT = Node->getValueType(0);
3350 SDValue RHS = Node->getOperand(2);
3351 AtomicSDNode *AN = cast<AtomicSDNode>(Node);
3352 if (RHS->getOpcode() == ISD::SIGN_EXTEND_INREG &&
3353 cast<VTSDNode>(RHS->getOperand(1))->getVT() == AN->getMemoryVT())
3354 RHS = RHS->getOperand(0);
3355 SDValue NewRHS =
3356 DAG.getNode(ISD::SUB, DL, VT, DAG.getConstant(0, DL, VT), RHS);
3358 Node->getOperand(0), Node->getOperand(1),
3359 NewRHS, AN->getMemOperand());
3360 Results.push_back(Res);
3361 Results.push_back(Res.getValue(1));
3362 break;
3363 }
3365 ExpandDYNAMIC_STACKALLOC(Node, Results);
3366 break;
3367 case ISD::MERGE_VALUES:
3368 for (unsigned i = 0; i < Node->getNumValues(); i++)
3369 Results.push_back(Node->getOperand(i));
3370 break;
3371 case ISD::POISON:
3372 case ISD::UNDEF: {
3373 EVT VT = Node->getValueType(0);
3374 if (VT.isInteger())
3375 Results.push_back(DAG.getConstant(0, dl, VT));
3376 else {
3377 assert(VT.isFloatingPoint() && "Unknown value type!");
3378 Results.push_back(DAG.getConstantFP(0, dl, VT));
3379 }
3380 break;
3381 }
3383 // When strict mode is enforced we can't do expansion because it
3384 // does not honor the "strict" properties. Only libcall is allowed.
3385 if (TLI.isStrictFPEnabled())
3386 break;
3387 // We might as well mutate to FP_ROUND when FP_ROUND operation is legal
3388 // since this operation is more efficient than stack operation.
3389 if (TLI.getStrictFPOperationAction(Node->getOpcode(),
3390 Node->getValueType(0))
3391 == TargetLowering::Legal)
3392 break;
3393 // We fall back to use stack operation when the FP_ROUND operation
3394 // isn't available.
3395 if ((Tmp1 = EmitStackConvert(Node->getOperand(1), Node->getValueType(0),
3396 Node->getValueType(0), dl,
3397 Node->getOperand(0)))) {
3398 ReplaceNode(Node, Tmp1.getNode());
3399 LLVM_DEBUG(dbgs() << "Successfully expanded STRICT_FP_ROUND node\n");
3400 return true;
3401 }
3402 break;
3403 case ISD::FP_ROUND: {
3404 if ((Tmp1 = TLI.expandFP_ROUND(Node, DAG))) {
3405 Results.push_back(Tmp1);
3406 break;
3407 }
3408
3409 [[fallthrough]];
3410 }
3411 case ISD::BITCAST:
3412 if ((Tmp1 = EmitStackConvert(Node->getOperand(0), Node->getValueType(0),
3413 Node->getValueType(0), dl)))
3414 Results.push_back(Tmp1);
3415 break;
3417 // When strict mode is enforced we can't do expansion because it
3418 // does not honor the "strict" properties. Only libcall is allowed.
3419 if (TLI.isStrictFPEnabled())
3420 break;
3421 // We might as well mutate to FP_EXTEND when FP_EXTEND operation is legal
3422 // since this operation is more efficient than stack operation.
3423 if (TLI.getStrictFPOperationAction(Node->getOpcode(),
3424 Node->getValueType(0))
3425 == TargetLowering::Legal)
3426 break;
3427 // We fall back to use stack operation when the FP_EXTEND operation
3428 // isn't available.
3429 if ((Tmp1 = EmitStackConvert(
3430 Node->getOperand(1), Node->getOperand(1).getValueType(),
3431 Node->getValueType(0), dl, Node->getOperand(0)))) {
3432 ReplaceNode(Node, Tmp1.getNode());
3433 LLVM_DEBUG(dbgs() << "Successfully expanded STRICT_FP_EXTEND node\n");
3434 return true;
3435 }
3436 break;
3437 case ISD::FP_EXTEND: {
3438 SDValue Op = Node->getOperand(0);
3439 EVT SrcVT = Op.getValueType();
3440 EVT DstVT = Node->getValueType(0);
3441 if (SrcVT.getScalarType() == MVT::bf16) {
3442 Results.push_back(DAG.getNode(ISD::BF16_TO_FP, SDLoc(Node), DstVT, Op));
3443 break;
3444 }
3445
3446 if ((Tmp1 = EmitStackConvert(Op, SrcVT, DstVT, dl)))
3447 Results.push_back(Tmp1);
3448 break;
3449 }
3450 case ISD::BF16_TO_FP: {
3451 // Always expand bf16 to f32 casts, they lower to ext + shift.
3452 //
3453 // Note that the operand of this code can be bf16 or an integer type in case
3454 // bf16 is not supported on the target and was softened.
3455 SDValue Op = Node->getOperand(0);
3456 if (Op.getValueType() == MVT::bf16) {
3457 Op = DAG.getNode(ISD::ANY_EXTEND, dl, MVT::i32,
3458 DAG.getNode(ISD::BITCAST, dl, MVT::i16, Op));
3459 } else {
3460 Op = DAG.getAnyExtOrTrunc(Op, dl, MVT::i32);
3461 }
3462 Op = DAG.getNode(ISD::SHL, dl, MVT::i32, Op,
3463 DAG.getShiftAmountConstant(16, MVT::i32, dl));
3464 Op = DAG.getNode(ISD::BITCAST, dl, MVT::f32, Op);
3465 // Add fp_extend in case the output is bigger than f32.
3466 if (Node->getValueType(0) != MVT::f32)
3467 Op = DAG.getNode(ISD::FP_EXTEND, dl, Node->getValueType(0), Op);
3468 Results.push_back(Op);
3469 break;
3470 }
3471 case ISD::FP_TO_BF16: {
3472 SDValue Op = Node->getOperand(0);
3473 if (Op.getValueType() != MVT::f32)
3474 Op = DAG.getNode(ISD::FP_ROUND, dl, MVT::f32, Op,
3475 DAG.getIntPtrConstant(0, dl, /*isTarget=*/true));
3476 // Certain SNaNs will turn into infinities if we do a simple shift right.
3477 if (!DAG.isKnownNeverSNaN(Op)) {
3478 Op = DAG.getNode(ISD::FCANONICALIZE, dl, MVT::f32, Op, Node->getFlags());
3479 }
3480 Op = DAG.getNode(ISD::SRL, dl, MVT::i32,
3481 DAG.getNode(ISD::BITCAST, dl, MVT::i32, Op),
3482 DAG.getShiftAmountConstant(16, MVT::i32, dl));
3483 // The result of this node can be bf16 or an integer type in case bf16 is
3484 // not supported on the target and was softened to i16 for storage.
3485 if (Node->getValueType(0) == MVT::bf16) {
3486 Op = DAG.getNode(ISD::BITCAST, dl, MVT::bf16,
3487 DAG.getNode(ISD::TRUNCATE, dl, MVT::i16, Op));
3488 } else {
3489 Op = DAG.getAnyExtOrTrunc(Op, dl, Node->getValueType(0));
3490 }
3491 Results.push_back(Op);
3492 break;
3493 }
3494 case ISD::FCANONICALIZE: {
3495 // This implements llvm.canonicalize.f* by multiplication with 1.0, as
3496 // suggested in
3497 // https://llvm.org/docs/LangRef.html#llvm-canonicalize-intrinsic.
3498 // It uses strict_fp operations even outside a strict_fp context in order
3499 // to guarantee that the canonicalization is not optimized away by later
3500 // passes. The result chain introduced by that is intentionally ignored
3501 // since no ordering requirement is intended here.
3502
3503 // Create strict multiplication by 1.0.
3504 SDValue Operand = Node->getOperand(0);
3505 EVT VT = Operand.getValueType();
3506 SDValue One = DAG.getConstantFP(1.0, dl, VT);
3507 SDValue Chain = DAG.getEntryNode();
3508 // Propagate existing flags on canonicalize, and additionally set
3509 // NoFPExcept.
3510 SDNodeFlags CanonicalizeFlags = Node->getFlags();
3511 CanonicalizeFlags.setNoFPExcept(true);
3512 SDValue Mul = DAG.getNode(ISD::STRICT_FMUL, dl, {VT, MVT::Other},
3513 {Chain, Operand, One}, CanonicalizeFlags);
3514
3515 Results.push_back(Mul);
3516 break;
3517 }
3519 EVT ExtraVT = cast<VTSDNode>(Node->getOperand(1))->getVT();
3520 EVT VT = Node->getValueType(0);
3521
3522 // An in-register sign-extend of a boolean is a negation:
3523 // 'true' (1) sign-extended is -1.
3524 // 'false' (0) sign-extended is 0.
3525 // However, we must mask the high bits of the source operand because the
3526 // SIGN_EXTEND_INREG does not guarantee that the high bits are already zero.
3527
3528 // TODO: Do this for vectors too?
3529 if (ExtraVT.isScalarInteger() && ExtraVT.getSizeInBits() == 1) {
3530 SDValue One = DAG.getConstant(1, dl, VT);
3531 SDValue And = DAG.getNode(ISD::AND, dl, VT, Node->getOperand(0), One);
3532 SDValue Zero = DAG.getConstant(0, dl, VT);
3533 SDValue Neg = DAG.getNode(ISD::SUB, dl, VT, Zero, And);
3534 Results.push_back(Neg);
3535 break;
3536 }
3537
3538 // NOTE: we could fall back on load/store here too for targets without
3539 // SRA. However, it is doubtful that any exist.
3540 unsigned BitsDiff = VT.getScalarSizeInBits() -
3541 ExtraVT.getScalarSizeInBits();
3542 SDValue ShiftCst = DAG.getShiftAmountConstant(BitsDiff, VT, dl);
3543 Tmp1 = DAG.getNode(ISD::SHL, dl, VT, Node->getOperand(0), ShiftCst);
3544 Tmp1 = DAG.getNode(ISD::SRA, dl, VT, Tmp1, ShiftCst);
3545 Results.push_back(Tmp1);
3546 break;
3547 }
3548 case ISD::UINT_TO_FP:
3550 if (TLI.expandUINT_TO_FP(Node, Tmp1, Tmp2, DAG)) {
3551 Results.push_back(Tmp1);
3552 if (Node->isStrictFPOpcode())
3553 Results.push_back(Tmp2);
3554 break;
3555 }
3556 [[fallthrough]];
3557 case ISD::SINT_TO_FP:
3559 if ((Tmp1 = ExpandLegalINT_TO_FP(Node, Tmp2))) {
3560 Results.push_back(Tmp1);
3561 if (Node->isStrictFPOpcode())
3562 Results.push_back(Tmp2);
3563 }
3564 break;
3565 case ISD::FP_TO_SINT:
3566 if (TLI.expandFP_TO_SINT(Node, Tmp1, DAG))
3567 Results.push_back(Tmp1);
3568 break;
3570 if (TLI.expandFP_TO_SINT(Node, Tmp1, DAG)) {
3571 ReplaceNode(Node, Tmp1.getNode());
3572 LLVM_DEBUG(dbgs() << "Successfully expanded STRICT_FP_TO_SINT node\n");
3573 return true;
3574 }
3575 break;
3576 case ISD::FP_TO_UINT:
3577 if (TLI.expandFP_TO_UINT(Node, Tmp1, Tmp2, DAG))
3578 Results.push_back(Tmp1);
3579 break;
3581 if (TLI.expandFP_TO_UINT(Node, Tmp1, Tmp2, DAG)) {
3582 // Relink the chain.
3583 DAG.ReplaceAllUsesOfValueWith(SDValue(Node,1), Tmp2);
3584 // Replace the new UINT result.
3585 ReplaceNodeWithValue(SDValue(Node, 0), Tmp1);
3586 LLVM_DEBUG(dbgs() << "Successfully expanded STRICT_FP_TO_UINT node\n");
3587 return true;
3588 }
3589 break;
3592 Results.push_back(TLI.expandFP_TO_INT_SAT(Node, DAG));
3593 break;
3594 case ISD::LROUND:
3595 case ISD::LLROUND: {
3596 SDValue Arg = Node->getOperand(0);
3597 EVT ArgVT = Arg.getValueType();
3598 EVT ResVT = Node->getValueType(0);
3599 SDLoc dl(Node);
3600 SDValue RoundNode = DAG.getNode(ISD::FROUND, dl, ArgVT, Arg);
3601 Results.push_back(DAG.getNode(ISD::FP_TO_SINT, dl, ResVT, RoundNode));
3602 break;
3603 }
3604 case ISD::VAARG:
3605 Results.push_back(DAG.expandVAArg(Node));
3606 Results.push_back(Results[0].getValue(1));
3607 break;
3608 case ISD::VACOPY:
3609 Results.push_back(DAG.expandVACopy(Node));
3610 break;
3612 if (Node->getOperand(0).getValueType().getVectorElementCount().isScalar())
3613 // This must be an access of the only element. Return it.
3614 Tmp1 = DAG.getNode(ISD::BITCAST, dl, Node->getValueType(0),
3615 Node->getOperand(0));
3616 else
3617 Tmp1 = ExpandExtractFromVectorThroughStack(SDValue(Node, 0));
3618 Results.push_back(Tmp1);
3619 break;
3621 Results.push_back(ExpandExtractFromVectorThroughStack(SDValue(Node, 0)));
3622 break;
3624 Results.push_back(ExpandInsertToVectorThroughStack(SDValue(Node, 0)));
3625 break;
3627 if (EVT VectorValueType = Node->getOperand(0).getValueType();
3628 VectorValueType.isScalableVector() ||
3629 TLI.isOperationExpand(ISD::EXTRACT_VECTOR_ELT, VectorValueType))
3630 Results.push_back(ExpandVectorBuildThroughStack(Node));
3631 else
3632 Results.push_back(ExpandConcatVectors(Node));
3633 break;
3635 Results.push_back(ExpandSCALAR_TO_VECTOR(Node));
3636 break;
3638 Results.push_back(ExpandINSERT_VECTOR_ELT(SDValue(Node, 0)));
3639 break;
3640 case ISD::VECTOR_SHUFFLE: {
3641 SmallVector<int, 32> NewMask;
3642 ArrayRef<int> Mask = cast<ShuffleVectorSDNode>(Node)->getMask();
3643
3644 EVT VT = Node->getValueType(0);
3645 EVT EltVT = VT.getVectorElementType();
3646 SDValue Op0 = Node->getOperand(0);
3647 SDValue Op1 = Node->getOperand(1);
3648 if (!TLI.isTypeLegal(EltVT)) {
3649 EVT NewEltVT = TLI.getTypeToTransformTo(*DAG.getContext(), EltVT);
3650
3651 // BUILD_VECTOR operands are allowed to be wider than the element type.
3652 // But if NewEltVT is smaller that EltVT the BUILD_VECTOR does not accept
3653 // it.
3654 if (NewEltVT.bitsLT(EltVT)) {
3655 // Convert shuffle node.
3656 // If original node was v4i64 and the new EltVT is i32,
3657 // cast operands to v8i32 and re-build the mask.
3658
3659 // Calculate new VT, the size of the new VT should be equal to original.
3660 EVT NewVT =
3661 EVT::getVectorVT(*DAG.getContext(), NewEltVT,
3662 VT.getSizeInBits() / NewEltVT.getSizeInBits());
3663 assert(NewVT.bitsEq(VT));
3664
3665 // cast operands to new VT
3666 Op0 = DAG.getNode(ISD::BITCAST, dl, NewVT, Op0);
3667 Op1 = DAG.getNode(ISD::BITCAST, dl, NewVT, Op1);
3668
3669 // Convert the shuffle mask
3670 unsigned int factor =
3672
3673 // EltVT gets smaller
3674 assert(factor > 0);
3675
3676 for (unsigned i = 0; i < VT.getVectorNumElements(); ++i) {
3677 if (Mask[i] < 0) {
3678 for (unsigned fi = 0; fi < factor; ++fi)
3679 NewMask.push_back(Mask[i]);
3680 }
3681 else {
3682 for (unsigned fi = 0; fi < factor; ++fi)
3683 NewMask.push_back(Mask[i]*factor+fi);
3684 }
3685 }
3686 Mask = NewMask;
3687 VT = NewVT;
3688 }
3689 EltVT = NewEltVT;
3690 }
3691 unsigned NumElems = VT.getVectorNumElements();
3693 for (unsigned i = 0; i != NumElems; ++i) {
3694 if (Mask[i] < 0) {
3695 Ops.push_back(DAG.getUNDEF(EltVT));
3696 continue;
3697 }
3698 unsigned Idx = Mask[i];
3699 if (Idx < NumElems)
3700 Ops.push_back(DAG.getNode(ISD::EXTRACT_VECTOR_ELT, dl, EltVT, Op0,
3701 DAG.getVectorIdxConstant(Idx, dl)));
3702 else
3703 Ops.push_back(
3704 DAG.getNode(ISD::EXTRACT_VECTOR_ELT, dl, EltVT, Op1,
3705 DAG.getVectorIdxConstant(Idx - NumElems, dl)));
3706 }
3707
3708 Tmp1 = DAG.getBuildVector(VT, dl, Ops);
3709 // We may have changed the BUILD_VECTOR type. Cast it back to the Node type.
3710 Tmp1 = DAG.getNode(ISD::BITCAST, dl, Node->getValueType(0), Tmp1);
3711 Results.push_back(Tmp1);
3712 break;
3713 }
3714 case ISD::VECTOR_SPLICE: {
3715 Results.push_back(TLI.expandVectorSplice(Node, DAG));
3716 break;
3717 }
3719 unsigned Factor = Node->getNumOperands();
3720 if (Factor <= 2 || !isPowerOf2_32(Factor))
3721 break;
3723 EVT VecVT = Node->getValueType(0);
3724 SmallVector<EVT> HalfVTs(Factor / 2, VecVT);
3725 // Deinterleave at Factor/2 so each result contains two factors interleaved:
3726 // a0b0 c0d0 a1b1 c1d1 -> [a0c0 b0d0] [a1c1 b1d1]
3727 SDValue L = DAG.getNode(ISD::VECTOR_DEINTERLEAVE, dl, HalfVTs,
3728 ArrayRef(Ops).take_front(Factor / 2));
3729 SDValue R = DAG.getNode(ISD::VECTOR_DEINTERLEAVE, dl, HalfVTs,
3730 ArrayRef(Ops).take_back(Factor / 2));
3731 Results.resize(Factor);
3732 // Deinterleave the 2 factors out:
3733 // [a0c0 a1c1] [b0d0 b1d1] -> a0a1 b0b1 c0c1 d0d1
3734 for (unsigned I = 0; I < Factor / 2; I++) {
3736 DAG.getNode(ISD::VECTOR_DEINTERLEAVE, dl, {VecVT, VecVT},
3737 {L.getValue(I), R.getValue(I)});
3738 Results[I] = Deinterleave.getValue(0);
3739 Results[I + Factor / 2] = Deinterleave.getValue(1);
3740 }
3741 break;
3742 }
3744 unsigned Factor = Node->getNumOperands();
3745 if (Factor <= 2 || !isPowerOf2_32(Factor))
3746 break;
3747 EVT VecVT = Node->getValueType(0);
3748 SmallVector<EVT> HalfVTs(Factor / 2, VecVT);
3749 SmallVector<SDValue, 8> LOps, ROps;
3750 // Interleave so we have 2 factors per result:
3751 // a0a1 b0b1 c0c1 d0d1 -> [a0c0 b0d0] [a1c1 b1d1]
3752 for (unsigned I = 0; I < Factor / 2; I++) {
3753 SDValue Interleave =
3754 DAG.getNode(ISD::VECTOR_INTERLEAVE, dl, {VecVT, VecVT},
3755 {Node->getOperand(I), Node->getOperand(I + Factor / 2)});
3756 LOps.push_back(Interleave.getValue(0));
3757 ROps.push_back(Interleave.getValue(1));
3758 }
3759 // Interleave at Factor/2:
3760 // [a0c0 b0d0] [a1c1 b1d1] -> a0b0 c0d0 a1b1 c1d1
3761 SDValue L = DAG.getNode(ISD::VECTOR_INTERLEAVE, dl, HalfVTs, LOps);
3762 SDValue R = DAG.getNode(ISD::VECTOR_INTERLEAVE, dl, HalfVTs, ROps);
3763 for (unsigned I = 0; I < Factor / 2; I++)
3764 Results.push_back(L.getValue(I));
3765 for (unsigned I = 0; I < Factor / 2; I++)
3766 Results.push_back(R.getValue(I));
3767 break;
3768 }
3769 case ISD::EXTRACT_ELEMENT: {
3770 EVT OpTy = Node->getOperand(0).getValueType();
3771 if (Node->getConstantOperandVal(1)) {
3772 // 1 -> Hi
3773 Tmp1 = DAG.getNode(
3774 ISD::SRL, dl, OpTy, Node->getOperand(0),
3775 DAG.getShiftAmountConstant(OpTy.getSizeInBits() / 2, OpTy, dl));
3776 Tmp1 = DAG.getNode(ISD::TRUNCATE, dl, Node->getValueType(0), Tmp1);
3777 } else {
3778 // 0 -> Lo
3779 Tmp1 = DAG.getNode(ISD::TRUNCATE, dl, Node->getValueType(0),
3780 Node->getOperand(0));
3781 }
3782 Results.push_back(Tmp1);
3783 break;
3784 }
3785 case ISD::STACKSAVE:
3786 // Expand to CopyFromReg if the target set
3787 // StackPointerRegisterToSaveRestore.
3789 Results.push_back(DAG.getCopyFromReg(Node->getOperand(0), dl, SP,
3790 Node->getValueType(0)));
3791 Results.push_back(Results[0].getValue(1));
3792 } else {
3793 Results.push_back(DAG.getUNDEF(Node->getValueType(0)));
3794 Results.push_back(Node->getOperand(0));
3795 }
3796 break;
3797 case ISD::STACKRESTORE:
3798 // Expand to CopyToReg if the target set
3799 // StackPointerRegisterToSaveRestore.
3801 Results.push_back(DAG.getCopyToReg(Node->getOperand(0), dl, SP,
3802 Node->getOperand(1)));
3803 } else {
3804 Results.push_back(Node->getOperand(0));
3805 }
3806 break;
3808 Results.push_back(DAG.getConstant(0, dl, Node->getValueType(0)));
3809 Results.push_back(Results[0].getValue(0));
3810 break;
3811 case ISD::FCOPYSIGN:
3812 Results.push_back(ExpandFCOPYSIGN(Node));
3813 break;
3814 case ISD::FNEG:
3815 Results.push_back(ExpandFNEG(Node));
3816 break;
3817 case ISD::FABS:
3818 Results.push_back(ExpandFABS(Node));
3819 break;
3820 case ISD::IS_FPCLASS: {
3821 auto Test = static_cast<FPClassTest>(Node->getConstantOperandVal(1));
3822 if (SDValue Expanded =
3823 TLI.expandIS_FPCLASS(Node->getValueType(0), Node->getOperand(0),
3824 Test, Node->getFlags(), SDLoc(Node), DAG))
3825 Results.push_back(Expanded);
3826 break;
3827 }
3828 case ISD::SMIN:
3829 case ISD::SMAX:
3830 case ISD::UMIN:
3831 case ISD::UMAX: {
3832 // Expand Y = MAX(A, B) -> Y = (A > B) ? A : B
3833 ISD::CondCode Pred;
3834 switch (Node->getOpcode()) {
3835 default: llvm_unreachable("How did we get here?");
3836 case ISD::SMAX: Pred = ISD::SETGT; break;
3837 case ISD::SMIN: Pred = ISD::SETLT; break;
3838 case ISD::UMAX: Pred = ISD::SETUGT; break;
3839 case ISD::UMIN: Pred = ISD::SETULT; break;
3840 }
3841 Tmp1 = Node->getOperand(0);
3842 Tmp2 = Node->getOperand(1);
3843 Tmp1 = DAG.getSelectCC(dl, Tmp1, Tmp2, Tmp1, Tmp2, Pred);
3844 Results.push_back(Tmp1);
3845 break;
3846 }
3847 case ISD::FMINNUM:
3848 case ISD::FMAXNUM: {
3849 if (SDValue Expanded = TLI.expandFMINNUM_FMAXNUM(Node, DAG))
3850 Results.push_back(Expanded);
3851 break;
3852 }
3853 case ISD::FMINIMUM:
3854 case ISD::FMAXIMUM: {
3855 if (SDValue Expanded = TLI.expandFMINIMUM_FMAXIMUM(Node, DAG))
3856 Results.push_back(Expanded);
3857 break;
3858 }
3859 case ISD::FMINIMUMNUM:
3860 case ISD::FMAXIMUMNUM: {
3861 Results.push_back(TLI.expandFMINIMUMNUM_FMAXIMUMNUM(Node, DAG));
3862 break;
3863 }
3864 case ISD::FSIN:
3865 case ISD::FCOS: {
3866 EVT VT = Node->getValueType(0);
3867 // Turn fsin / fcos into ISD::FSINCOS node if there are a pair of fsin /
3868 // fcos which share the same operand and both are used.
3869 if ((TLI.isOperationLegal(ISD::FSINCOS, VT) ||
3870 isSinCosLibcallAvailable(Node, TLI)) &&
3871 useSinCos(Node)) {
3872 SDVTList VTs = DAG.getVTList(VT, VT);
3873 Tmp1 = DAG.getNode(ISD::FSINCOS, dl, VTs, Node->getOperand(0));
3874 if (Node->getOpcode() == ISD::FCOS)
3875 Tmp1 = Tmp1.getValue(1);
3876 Results.push_back(Tmp1);
3877 }
3878 break;
3879 }
3880 case ISD::FLDEXP:
3881 case ISD::STRICT_FLDEXP: {
3882 EVT VT = Node->getValueType(0);
3883 RTLIB::Libcall LC = RTLIB::getLDEXP(VT);
3884 // Use the LibCall instead, it is very likely faster
3885 // FIXME: Use separate LibCall action.
3886 if (TLI.getLibcallImpl(LC) != RTLIB::Unsupported)
3887 break;
3888
3889 if (SDValue Expanded = expandLdexp(Node)) {
3890 Results.push_back(Expanded);
3891 if (Node->getOpcode() == ISD::STRICT_FLDEXP)
3892 Results.push_back(Expanded.getValue(1));
3893 }
3894
3895 break;
3896 }
3897 case ISD::FFREXP: {
3898 RTLIB::Libcall LC = RTLIB::getFREXP(Node->getValueType(0));
3899 // Use the LibCall instead, it is very likely faster
3900 // FIXME: Use separate LibCall action.
3901 if (TLI.getLibcallImpl(LC) != RTLIB::Unsupported)
3902 break;
3903
3904 if (SDValue Expanded = expandFrexp(Node)) {
3905 Results.push_back(Expanded);
3906 Results.push_back(Expanded.getValue(1));
3907 }
3908 break;
3909 }
3910 case ISD::FSINCOS: {
3911 if (isSinCosLibcallAvailable(Node, TLI))
3912 break;
3913 EVT VT = Node->getValueType(0);
3914 SDValue Op = Node->getOperand(0);
3915 SDNodeFlags Flags = Node->getFlags();
3916 Tmp1 = DAG.getNode(ISD::FSIN, dl, VT, Op, Flags);
3917 Tmp2 = DAG.getNode(ISD::FCOS, dl, VT, Op, Flags);
3918 Results.append({Tmp1, Tmp2});
3919 break;
3920 }
3921 case ISD::FMAD:
3922 llvm_unreachable("Illegal fmad should never be formed");
3923
3924 case ISD::FP16_TO_FP:
3925 if (Node->getValueType(0) != MVT::f32) {
3926 // We can extend to types bigger than f32 in two steps without changing
3927 // the result. Since "f16 -> f32" is much more commonly available, give
3928 // CodeGen the option of emitting that before resorting to a libcall.
3929 SDValue Res =
3930 DAG.getNode(ISD::FP16_TO_FP, dl, MVT::f32, Node->getOperand(0));
3931 Results.push_back(
3932 DAG.getNode(ISD::FP_EXTEND, dl, Node->getValueType(0), Res));
3933 }
3934 break;
3937 if (Node->getValueType(0) != MVT::f32) {
3938 // We can extend to types bigger than f32 in two steps without changing
3939 // the result. Since "f16 -> f32" is much more commonly available, give
3940 // CodeGen the option of emitting that before resorting to a libcall.
3941 SDValue Res = DAG.getNode(Node->getOpcode(), dl, {MVT::f32, MVT::Other},
3942 {Node->getOperand(0), Node->getOperand(1)});
3943 Res = DAG.getNode(ISD::STRICT_FP_EXTEND, dl,
3944 {Node->getValueType(0), MVT::Other},
3945 {Res.getValue(1), Res});
3946 Results.push_back(Res);
3947 Results.push_back(Res.getValue(1));
3948 }
3949 break;
3950 case ISD::FP_TO_FP16:
3951 LLVM_DEBUG(dbgs() << "Legalizing FP_TO_FP16\n");
3952 if (Node->getFlags().hasApproximateFuncs() && !TLI.useSoftFloat()) {
3953 SDValue Op = Node->getOperand(0);
3954 MVT SVT = Op.getSimpleValueType();
3955 if ((SVT == MVT::f64 || SVT == MVT::f80) &&
3957 // Under fastmath, we can expand this node into a fround followed by
3958 // a float-half conversion.
3959 SDValue FloatVal =
3960 DAG.getNode(ISD::FP_ROUND, dl, MVT::f32, Op,
3961 DAG.getIntPtrConstant(0, dl, /*isTarget=*/true));
3962 Results.push_back(
3963 DAG.getNode(ISD::FP_TO_FP16, dl, Node->getValueType(0), FloatVal));
3964 }
3965 }
3966 break;
3967 case ISD::ConstantFP: {
3968 ConstantFPSDNode *CFP = cast<ConstantFPSDNode>(Node);
3969 // Check to see if this FP immediate is already legal.
3970 // If this is a legal constant, turn it into a TargetConstantFP node.
3971 if (!TLI.isFPImmLegal(CFP->getValueAPF(), Node->getValueType(0),
3972 DAG.shouldOptForSize()))
3973 Results.push_back(ExpandConstantFP(CFP, true));
3974 break;
3975 }
3976 case ISD::Constant: {
3977 ConstantSDNode *CP = cast<ConstantSDNode>(Node);
3978 Results.push_back(ExpandConstant(CP));
3979 break;
3980 }
3981 case ISD::FSUB: {
3982 EVT VT = Node->getValueType(0);
3983 if (TLI.isOperationLegalOrCustom(ISD::FADD, VT) &&
3985 const SDNodeFlags Flags = Node->getFlags();
3986 Tmp1 = DAG.getNode(ISD::FNEG, dl, VT, Node->getOperand(1));
3987 Tmp1 = DAG.getNode(ISD::FADD, dl, VT, Node->getOperand(0), Tmp1, Flags);
3988 Results.push_back(Tmp1);
3989 }
3990 break;
3991 }
3992 case ISD::SUB: {
3993 EVT VT = Node->getValueType(0);
3996 "Don't know how to expand this subtraction!");
3997 Tmp1 = DAG.getNOT(dl, Node->getOperand(1), VT);
3998 Tmp1 = DAG.getNode(ISD::ADD, dl, VT, Tmp1, DAG.getConstant(1, dl, VT));
3999 Results.push_back(DAG.getNode(ISD::ADD, dl, VT, Node->getOperand(0), Tmp1));
4000 break;
4001 }
4002 case ISD::UREM:
4003 case ISD::SREM:
4004 if (TLI.expandREM(Node, Tmp1, DAG))
4005 Results.push_back(Tmp1);
4006 break;
4007 case ISD::UDIV:
4008 case ISD::SDIV: {
4009 bool isSigned = Node->getOpcode() == ISD::SDIV;
4010 unsigned DivRemOpc = isSigned ? ISD::SDIVREM : ISD::UDIVREM;
4011 EVT VT = Node->getValueType(0);
4012 if (TLI.isOperationLegalOrCustom(DivRemOpc, VT)) {
4013 SDVTList VTs = DAG.getVTList(VT, VT);
4014 Tmp1 = DAG.getNode(DivRemOpc, dl, VTs, Node->getOperand(0),
4015 Node->getOperand(1));
4016 Results.push_back(Tmp1);
4017 }
4018 break;
4019 }
4020 case ISD::MULHU:
4021 case ISD::MULHS: {
4022 unsigned ExpandOpcode =
4023 Node->getOpcode() == ISD::MULHU ? ISD::UMUL_LOHI : ISD::SMUL_LOHI;
4024 EVT VT = Node->getValueType(0);
4025 SDVTList VTs = DAG.getVTList(VT, VT);
4026
4027 Tmp1 = DAG.getNode(ExpandOpcode, dl, VTs, Node->getOperand(0),
4028 Node->getOperand(1));
4029 Results.push_back(Tmp1.getValue(1));
4030 break;
4031 }
4032 case ISD::UMUL_LOHI:
4033 case ISD::SMUL_LOHI: {
4034 SDValue LHS = Node->getOperand(0);
4035 SDValue RHS = Node->getOperand(1);
4036 MVT VT = LHS.getSimpleValueType();
4037 unsigned MULHOpcode =
4038 Node->getOpcode() == ISD::UMUL_LOHI ? ISD::MULHU : ISD::MULHS;
4039
4040 if (TLI.isOperationLegalOrCustom(MULHOpcode, VT)) {
4041 Results.push_back(DAG.getNode(ISD::MUL, dl, VT, LHS, RHS));
4042 Results.push_back(DAG.getNode(MULHOpcode, dl, VT, LHS, RHS));
4043 break;
4044 }
4045
4047 EVT HalfType = EVT(VT).getHalfSizedIntegerVT(*DAG.getContext());
4048 assert(TLI.isTypeLegal(HalfType));
4049 if (TLI.expandMUL_LOHI(Node->getOpcode(), VT, dl, LHS, RHS, Halves,
4050 HalfType, DAG,
4051 TargetLowering::MulExpansionKind::Always)) {
4052 for (unsigned i = 0; i < 2; ++i) {
4053 SDValue Lo = DAG.getNode(ISD::ZERO_EXTEND, dl, VT, Halves[2 * i]);
4054 SDValue Hi = DAG.getNode(ISD::ANY_EXTEND, dl, VT, Halves[2 * i + 1]);
4055 SDValue Shift =
4056 DAG.getShiftAmountConstant(HalfType.getScalarSizeInBits(), VT, dl);
4057 Hi = DAG.getNode(ISD::SHL, dl, VT, Hi, Shift);
4058 Results.push_back(DAG.getNode(ISD::OR, dl, VT, Lo, Hi));
4059 }
4060 break;
4061 }
4062 break;
4063 }
4064 case ISD::MUL: {
4065 EVT VT = Node->getValueType(0);
4066 SDVTList VTs = DAG.getVTList(VT, VT);
4067 // See if multiply or divide can be lowered using two-result operations.
4068 // We just need the low half of the multiply; try both the signed
4069 // and unsigned forms. If the target supports both SMUL_LOHI and
4070 // UMUL_LOHI, form a preference by checking which forms of plain
4071 // MULH it supports.
4072 bool HasSMUL_LOHI = TLI.isOperationLegalOrCustom(ISD::SMUL_LOHI, VT);
4073 bool HasUMUL_LOHI = TLI.isOperationLegalOrCustom(ISD::UMUL_LOHI, VT);
4074 bool HasMULHS = TLI.isOperationLegalOrCustom(ISD::MULHS, VT);
4075 bool HasMULHU = TLI.isOperationLegalOrCustom(ISD::MULHU, VT);
4076 unsigned OpToUse = 0;
4077 if (HasSMUL_LOHI && !HasMULHS) {
4078 OpToUse = ISD::SMUL_LOHI;
4079 } else if (HasUMUL_LOHI && !HasMULHU) {
4080 OpToUse = ISD::UMUL_LOHI;
4081 } else if (HasSMUL_LOHI) {
4082 OpToUse = ISD::SMUL_LOHI;
4083 } else if (HasUMUL_LOHI) {
4084 OpToUse = ISD::UMUL_LOHI;
4085 }
4086 if (OpToUse) {
4087 Results.push_back(DAG.getNode(OpToUse, dl, VTs, Node->getOperand(0),
4088 Node->getOperand(1)));
4089 break;
4090 }
4091
4092 SDValue Lo, Hi;
4093 EVT HalfType = VT.getHalfSizedIntegerVT(*DAG.getContext());
4098 TLI.expandMUL(Node, Lo, Hi, HalfType, DAG,
4099 TargetLowering::MulExpansionKind::OnlyLegalOrCustom)) {
4100 Lo = DAG.getNode(ISD::ZERO_EXTEND, dl, VT, Lo);
4101 Hi = DAG.getNode(ISD::ANY_EXTEND, dl, VT, Hi);
4102 SDValue Shift =
4103 DAG.getShiftAmountConstant(HalfType.getSizeInBits(), VT, dl);
4104 Hi = DAG.getNode(ISD::SHL, dl, VT, Hi, Shift);
4105 Results.push_back(DAG.getNode(ISD::OR, dl, VT, Lo, Hi));
4106 }
4107 break;
4108 }
4109 case ISD::FSHL:
4110 case ISD::FSHR:
4111 if (SDValue Expanded = TLI.expandFunnelShift(Node, DAG))
4112 Results.push_back(Expanded);
4113 break;
4114 case ISD::ROTL:
4115 case ISD::ROTR:
4116 if (SDValue Expanded = TLI.expandROT(Node, true /*AllowVectorOps*/, DAG))
4117 Results.push_back(Expanded);
4118 break;
4119 case ISD::SADDSAT:
4120 case ISD::UADDSAT:
4121 case ISD::SSUBSAT:
4122 case ISD::USUBSAT:
4123 Results.push_back(TLI.expandAddSubSat(Node, DAG));
4124 break;
4125 case ISD::SCMP:
4126 case ISD::UCMP:
4127 Results.push_back(TLI.expandCMP(Node, DAG));
4128 break;
4129 case ISD::SSHLSAT:
4130 case ISD::USHLSAT:
4131 Results.push_back(TLI.expandShlSat(Node, DAG));
4132 break;
4133 case ISD::SMULFIX:
4134 case ISD::SMULFIXSAT:
4135 case ISD::UMULFIX:
4136 case ISD::UMULFIXSAT:
4137 Results.push_back(TLI.expandFixedPointMul(Node, DAG));
4138 break;
4139 case ISD::SDIVFIX:
4140 case ISD::SDIVFIXSAT:
4141 case ISD::UDIVFIX:
4142 case ISD::UDIVFIXSAT:
4143 if (SDValue V = TLI.expandFixedPointDiv(Node->getOpcode(), SDLoc(Node),
4144 Node->getOperand(0),
4145 Node->getOperand(1),
4146 Node->getConstantOperandVal(2),
4147 DAG)) {
4148 Results.push_back(V);
4149 break;
4150 }
4151 // FIXME: We might want to retry here with a wider type if we fail, if that
4152 // type is legal.
4153 // FIXME: Technically, so long as we only have sdivfixes where BW+Scale is
4154 // <= 128 (which is the case for all of the default Embedded-C types),
4155 // we will only get here with types and scales that we could always expand
4156 // if we were allowed to generate libcalls to division functions of illegal
4157 // type. But we cannot do that.
4158 llvm_unreachable("Cannot expand DIVFIX!");
4159 case ISD::UADDO_CARRY:
4160 case ISD::USUBO_CARRY: {
4161 SDValue LHS = Node->getOperand(0);
4162 SDValue RHS = Node->getOperand(1);
4163 SDValue Carry = Node->getOperand(2);
4164
4165 bool IsAdd = Node->getOpcode() == ISD::UADDO_CARRY;
4166
4167 // Initial add of the 2 operands.
4168 unsigned Op = IsAdd ? ISD::ADD : ISD::SUB;
4169 EVT VT = LHS.getValueType();
4170 SDValue Sum = DAG.getNode(Op, dl, VT, LHS, RHS);
4171
4172 // Initial check for overflow.
4173 EVT CarryType = Node->getValueType(1);
4174 EVT SetCCType = getSetCCResultType(Node->getValueType(0));
4175 ISD::CondCode CC = IsAdd ? ISD::SETULT : ISD::SETUGT;
4176 SDValue Overflow = DAG.getSetCC(dl, SetCCType, Sum, LHS, CC);
4177
4178 // Add of the sum and the carry.
4179 SDValue One = DAG.getConstant(1, dl, VT);
4180 SDValue CarryExt =
4181 DAG.getNode(ISD::AND, dl, VT, DAG.getZExtOrTrunc(Carry, dl, VT), One);
4182 SDValue Sum2 = DAG.getNode(Op, dl, VT, Sum, CarryExt);
4183
4184 // Second check for overflow. If we are adding, we can only overflow if the
4185 // initial sum is all 1s ang the carry is set, resulting in a new sum of 0.
4186 // If we are subtracting, we can only overflow if the initial sum is 0 and
4187 // the carry is set, resulting in a new sum of all 1s.
4188 SDValue Zero = DAG.getConstant(0, dl, VT);
4189 SDValue Overflow2 =
4190 IsAdd ? DAG.getSetCC(dl, SetCCType, Sum2, Zero, ISD::SETEQ)
4191 : DAG.getSetCC(dl, SetCCType, Sum, Zero, ISD::SETEQ);
4192 Overflow2 = DAG.getNode(ISD::AND, dl, SetCCType, Overflow2,
4193 DAG.getZExtOrTrunc(Carry, dl, SetCCType));
4194
4195 SDValue ResultCarry =
4196 DAG.getNode(ISD::OR, dl, SetCCType, Overflow, Overflow2);
4197
4198 Results.push_back(Sum2);
4199 Results.push_back(DAG.getBoolExtOrTrunc(ResultCarry, dl, CarryType, VT));
4200 break;
4201 }
4202 case ISD::SADDO:
4203 case ISD::SSUBO: {
4204 SDValue Result, Overflow;
4205 TLI.expandSADDSUBO(Node, Result, Overflow, DAG);
4206 Results.push_back(Result);
4207 Results.push_back(Overflow);
4208 break;
4209 }
4210 case ISD::UADDO:
4211 case ISD::USUBO: {
4212 SDValue Result, Overflow;
4213 TLI.expandUADDSUBO(Node, Result, Overflow, DAG);
4214 Results.push_back(Result);
4215 Results.push_back(Overflow);
4216 break;
4217 }
4218 case ISD::UMULO:
4219 case ISD::SMULO: {
4220 SDValue Result, Overflow;
4221 if (TLI.expandMULO(Node, Result, Overflow, DAG)) {
4222 Results.push_back(Result);
4223 Results.push_back(Overflow);
4224 }
4225 break;
4226 }
4227 case ISD::BUILD_PAIR: {
4228 EVT PairTy = Node->getValueType(0);
4229 Tmp1 = DAG.getNode(ISD::ZERO_EXTEND, dl, PairTy, Node->getOperand(0));
4230 Tmp2 = DAG.getNode(ISD::ANY_EXTEND, dl, PairTy, Node->getOperand(1));
4231 Tmp2 = DAG.getNode(
4232 ISD::SHL, dl, PairTy, Tmp2,
4233 DAG.getShiftAmountConstant(PairTy.getSizeInBits() / 2, PairTy, dl));
4234 Results.push_back(DAG.getNode(ISD::OR, dl, PairTy, Tmp1, Tmp2));
4235 break;
4236 }
4237 case ISD::SELECT:
4238 Tmp1 = Node->getOperand(0);
4239 Tmp2 = Node->getOperand(1);
4240 Tmp3 = Node->getOperand(2);
4241 if (Tmp1.getOpcode() == ISD::SETCC) {
4242 Tmp1 = DAG.getSelectCC(
4243 dl, Tmp1.getOperand(0), Tmp1.getOperand(1), Tmp2, Tmp3,
4244 cast<CondCodeSDNode>(Tmp1.getOperand(2))->get(), Node->getFlags());
4245 } else {
4246 Tmp1 =
4247 DAG.getSelectCC(dl, Tmp1, DAG.getConstant(0, dl, Tmp1.getValueType()),
4248 Tmp2, Tmp3, ISD::SETNE, Node->getFlags());
4249 }
4250 Results.push_back(Tmp1);
4251 break;
4252 case ISD::BR_JT: {
4253 SDValue Chain = Node->getOperand(0);
4254 SDValue Table = Node->getOperand(1);
4255 SDValue Index = Node->getOperand(2);
4256 int JTI = cast<JumpTableSDNode>(Table.getNode())->getIndex();
4257
4258 const DataLayout &TD = DAG.getDataLayout();
4259 EVT PTy = TLI.getPointerTy(TD);
4260
4261 unsigned EntrySize =
4263
4264 // For power-of-two jumptable entry sizes convert multiplication to a shift.
4265 // This transformation needs to be done here since otherwise the MIPS
4266 // backend will end up emitting a three instruction multiply sequence
4267 // instead of a single shift and MSP430 will call a runtime function.
4268 if (llvm::isPowerOf2_32(EntrySize))
4269 Index = DAG.getNode(
4270 ISD::SHL, dl, Index.getValueType(), Index,
4271 DAG.getConstant(llvm::Log2_32(EntrySize), dl, Index.getValueType()));
4272 else
4273 Index = DAG.getNode(ISD::MUL, dl, Index.getValueType(), Index,
4274 DAG.getConstant(EntrySize, dl, Index.getValueType()));
4275 SDValue Addr = DAG.getMemBasePlusOffset(Table, Index, dl);
4276
4277 EVT MemVT = EVT::getIntegerVT(*DAG.getContext(), EntrySize * 8);
4278 SDValue LD = DAG.getExtLoad(
4279 ISD::SEXTLOAD, dl, PTy, Chain, Addr,
4281 Addr = LD;
4282 if (TLI.isJumpTableRelative()) {
4283 // For PIC, the sequence is:
4284 // BRIND(RelocBase + load(Jumptable + index))
4285 // RelocBase can be JumpTable, GOT or some sort of global base.
4286 Addr = DAG.getMemBasePlusOffset(TLI.getPICJumpTableRelocBase(Table, DAG),
4287 Addr, dl);
4288 }
4289
4290 Tmp1 = TLI.expandIndirectJTBranch(dl, LD.getValue(1), Addr, JTI, DAG);
4291 Results.push_back(Tmp1);
4292 break;
4293 }
4294 case ISD::BRCOND:
4295 // Expand brcond's setcc into its constituent parts and create a BR_CC
4296 // Node.
4297 Tmp1 = Node->getOperand(0);
4298 Tmp2 = Node->getOperand(1);
4299 if (Tmp2.getOpcode() == ISD::SETCC &&
4301 Tmp2.getOperand(0).getValueType())) {
4302 Tmp1 = DAG.getNode(ISD::BR_CC, dl, MVT::Other, Tmp1, Tmp2.getOperand(2),
4303 Tmp2.getOperand(0), Tmp2.getOperand(1),
4304 Node->getOperand(2));
4305 } else {
4306 // We test only the i1 bit. Skip the AND if UNDEF or another AND.
4307 if (Tmp2.isUndef() ||
4308 (Tmp2.getOpcode() == ISD::AND && isOneConstant(Tmp2.getOperand(1))))
4309 Tmp3 = Tmp2;
4310 else
4311 Tmp3 = DAG.getNode(ISD::AND, dl, Tmp2.getValueType(), Tmp2,
4312 DAG.getConstant(1, dl, Tmp2.getValueType()));
4313 Tmp1 = DAG.getNode(ISD::BR_CC, dl, MVT::Other, Tmp1,
4314 DAG.getCondCode(ISD::SETNE), Tmp3,
4315 DAG.getConstant(0, dl, Tmp3.getValueType()),
4316 Node->getOperand(2));
4317 }
4318 Results.push_back(Tmp1);
4319 break;
4320 case ISD::SETCC:
4321 case ISD::VP_SETCC:
4322 case ISD::STRICT_FSETCC:
4323 case ISD::STRICT_FSETCCS: {
4324 bool IsVP = Node->getOpcode() == ISD::VP_SETCC;
4325 bool IsStrict = Node->getOpcode() == ISD::STRICT_FSETCC ||
4326 Node->getOpcode() == ISD::STRICT_FSETCCS;
4327 bool IsSignaling = Node->getOpcode() == ISD::STRICT_FSETCCS;
4328 SDValue Chain = IsStrict ? Node->getOperand(0) : SDValue();
4329 unsigned Offset = IsStrict ? 1 : 0;
4330 Tmp1 = Node->getOperand(0 + Offset);
4331 Tmp2 = Node->getOperand(1 + Offset);
4332 Tmp3 = Node->getOperand(2 + Offset);
4333 SDValue Mask, EVL;
4334 if (IsVP) {
4335 Mask = Node->getOperand(3 + Offset);
4336 EVL = Node->getOperand(4 + Offset);
4337 }
4338 bool Legalized = TLI.LegalizeSetCCCondCode(
4339 DAG, Node->getValueType(0), Tmp1, Tmp2, Tmp3, Mask, EVL, NeedInvert, dl,
4340 Chain, IsSignaling);
4341
4342 if (Legalized) {
4343 // If we expanded the SETCC by swapping LHS and RHS, or by inverting the
4344 // condition code, create a new SETCC node.
4345 if (Tmp3.getNode()) {
4346 if (IsStrict) {
4347 Tmp1 = DAG.getNode(Node->getOpcode(), dl, Node->getVTList(),
4348 {Chain, Tmp1, Tmp2, Tmp3}, Node->getFlags());
4349 Chain = Tmp1.getValue(1);
4350 } else if (IsVP) {
4351 Tmp1 = DAG.getNode(Node->getOpcode(), dl, Node->getValueType(0),
4352 {Tmp1, Tmp2, Tmp3, Mask, EVL}, Node->getFlags());
4353 } else {
4354 Tmp1 = DAG.getNode(Node->getOpcode(), dl, Node->getValueType(0), Tmp1,
4355 Tmp2, Tmp3, Node->getFlags());
4356 }
4357 }
4358
4359 // If we expanded the SETCC by inverting the condition code, then wrap
4360 // the existing SETCC in a NOT to restore the intended condition.
4361 if (NeedInvert) {
4362 if (!IsVP)
4363 Tmp1 = DAG.getLogicalNOT(dl, Tmp1, Tmp1->getValueType(0));
4364 else
4365 Tmp1 =
4366 DAG.getVPLogicalNOT(dl, Tmp1, Mask, EVL, Tmp1->getValueType(0));
4367 }
4368
4369 Results.push_back(Tmp1);
4370 if (IsStrict)
4371 Results.push_back(Chain);
4372
4373 break;
4374 }
4375
4376 // FIXME: It seems Legalized is false iff CCCode is Legal. I don't
4377 // understand if this code is useful for strict nodes.
4378 assert(!IsStrict && "Don't know how to expand for strict nodes.");
4379
4380 // Otherwise, SETCC for the given comparison type must be completely
4381 // illegal; expand it into a SELECT_CC.
4382 // FIXME: This drops the mask/evl for VP_SETCC.
4383 EVT VT = Node->getValueType(0);
4384 EVT Tmp1VT = Tmp1.getValueType();
4385 Tmp1 = DAG.getNode(ISD::SELECT_CC, dl, VT, Tmp1, Tmp2,
4386 DAG.getBoolConstant(true, dl, VT, Tmp1VT),
4387 DAG.getBoolConstant(false, dl, VT, Tmp1VT), Tmp3,
4388 Node->getFlags());
4389 Results.push_back(Tmp1);
4390 break;
4391 }
4392 case ISD::SELECT_CC: {
4393 // TODO: need to add STRICT_SELECT_CC and STRICT_SELECT_CCS
4394 Tmp1 = Node->getOperand(0); // LHS
4395 Tmp2 = Node->getOperand(1); // RHS
4396 Tmp3 = Node->getOperand(2); // True
4397 Tmp4 = Node->getOperand(3); // False
4398 EVT VT = Node->getValueType(0);
4399 SDValue Chain;
4400 SDValue CC = Node->getOperand(4);
4401 ISD::CondCode CCOp = cast<CondCodeSDNode>(CC)->get();
4402
4403 if (TLI.isCondCodeLegalOrCustom(CCOp, Tmp1.getSimpleValueType())) {
4404 // If the condition code is legal, then we need to expand this
4405 // node using SETCC and SELECT.
4406 EVT CmpVT = Tmp1.getValueType();
4408 "Cannot expand ISD::SELECT_CC when ISD::SELECT also needs to be "
4409 "expanded.");
4410 EVT CCVT = getSetCCResultType(CmpVT);
4411 SDValue Cond = DAG.getNode(ISD::SETCC, dl, CCVT, Tmp1, Tmp2, CC, Node->getFlags());
4412 Results.push_back(
4413 DAG.getSelect(dl, VT, Cond, Tmp3, Tmp4, Node->getFlags()));
4414 break;
4415 }
4416
4417 // SELECT_CC is legal, so the condition code must not be.
4418 bool Legalized = false;
4419 // Try to legalize by inverting the condition. This is for targets that
4420 // might support an ordered version of a condition, but not the unordered
4421 // version (or vice versa).
4422 ISD::CondCode InvCC = ISD::getSetCCInverse(CCOp, Tmp1.getValueType());
4423 if (TLI.isCondCodeLegalOrCustom(InvCC, Tmp1.getSimpleValueType())) {
4424 // Use the new condition code and swap true and false
4425 Legalized = true;
4426 Tmp1 =
4427 DAG.getSelectCC(dl, Tmp1, Tmp2, Tmp4, Tmp3, InvCC, Node->getFlags());
4428 } else {
4429 // If The inverse is not legal, then try to swap the arguments using
4430 // the inverse condition code.
4432 if (TLI.isCondCodeLegalOrCustom(SwapInvCC, Tmp1.getSimpleValueType())) {
4433 // The swapped inverse condition is legal, so swap true and false,
4434 // lhs and rhs.
4435 Legalized = true;
4436 Tmp1 = DAG.getSelectCC(dl, Tmp2, Tmp1, Tmp4, Tmp3, SwapInvCC,
4437 Node->getFlags());
4438 }
4439 }
4440
4441 if (!Legalized) {
4442 Legalized = TLI.LegalizeSetCCCondCode(
4443 DAG, getSetCCResultType(Tmp1.getValueType()), Tmp1, Tmp2, CC,
4444 /*Mask*/ SDValue(), /*EVL*/ SDValue(), NeedInvert, dl, Chain);
4445
4446 assert(Legalized && "Can't legalize SELECT_CC with legal condition!");
4447
4448 // If we expanded the SETCC by inverting the condition code, then swap
4449 // the True/False operands to match.
4450 if (NeedInvert)
4451 std::swap(Tmp3, Tmp4);
4452
4453 // If we expanded the SETCC by swapping LHS and RHS, or by inverting the
4454 // condition code, create a new SELECT_CC node.
4455 if (CC.getNode()) {
4456 Tmp1 = DAG.getNode(ISD::SELECT_CC, dl, Node->getValueType(0), Tmp1,
4457 Tmp2, Tmp3, Tmp4, CC, Node->getFlags());
4458 } else {
4459 Tmp2 = DAG.getConstant(0, dl, Tmp1.getValueType());
4460 CC = DAG.getCondCode(ISD::SETNE);
4461 Tmp1 = DAG.getNode(ISD::SELECT_CC, dl, Node->getValueType(0), Tmp1,
4462 Tmp2, Tmp3, Tmp4, CC, Node->getFlags());
4463 }
4464 }
4465 Results.push_back(Tmp1);
4466 break;
4467 }
4468 case ISD::BR_CC: {
4469 // TODO: need to add STRICT_BR_CC and STRICT_BR_CCS
4470 SDValue Chain;
4471 Tmp1 = Node->getOperand(0); // Chain
4472 Tmp2 = Node->getOperand(2); // LHS
4473 Tmp3 = Node->getOperand(3); // RHS
4474 Tmp4 = Node->getOperand(1); // CC
4475
4476 bool Legalized = TLI.LegalizeSetCCCondCode(
4477 DAG, getSetCCResultType(Tmp2.getValueType()), Tmp2, Tmp3, Tmp4,
4478 /*Mask*/ SDValue(), /*EVL*/ SDValue(), NeedInvert, dl, Chain);
4479 (void)Legalized;
4480 assert(Legalized && "Can't legalize BR_CC with legal condition!");
4481
4482 // If we expanded the SETCC by swapping LHS and RHS, create a new BR_CC
4483 // node.
4484 if (Tmp4.getNode()) {
4485 assert(!NeedInvert && "Don't know how to invert BR_CC!");
4486
4487 Tmp1 = DAG.getNode(ISD::BR_CC, dl, Node->getValueType(0), Tmp1,
4488 Tmp4, Tmp2, Tmp3, Node->getOperand(4));
4489 } else {
4490 Tmp3 = DAG.getConstant(0, dl, Tmp2.getValueType());
4491 Tmp4 = DAG.getCondCode(NeedInvert ? ISD::SETEQ : ISD::SETNE);
4492 Tmp1 = DAG.getNode(ISD::BR_CC, dl, Node->getValueType(0), Tmp1, Tmp4,
4493 Tmp2, Tmp3, Node->getOperand(4));
4494 }
4495 Results.push_back(Tmp1);
4496 break;
4497 }
4498 case ISD::BUILD_VECTOR:
4499 Results.push_back(ExpandBUILD_VECTOR(Node));
4500 break;
4501 case ISD::SPLAT_VECTOR:
4502 Results.push_back(ExpandSPLAT_VECTOR(Node));
4503 break;
4504 case ISD::SRA:
4505 case ISD::SRL:
4506 case ISD::SHL: {
4507 // Scalarize vector SRA/SRL/SHL.
4508 EVT VT = Node->getValueType(0);
4509 assert(VT.isVector() && "Unable to legalize non-vector shift");
4510 assert(TLI.isTypeLegal(VT.getScalarType())&& "Element type must be legal");
4511 unsigned NumElem = VT.getVectorNumElements();
4512
4514 for (unsigned Idx = 0; Idx < NumElem; Idx++) {
4515 SDValue Ex =
4517 Node->getOperand(0), DAG.getVectorIdxConstant(Idx, dl));
4518 SDValue Sh =
4520 Node->getOperand(1), DAG.getVectorIdxConstant(Idx, dl));
4521 Scalars.push_back(DAG.getNode(Node->getOpcode(), dl,
4522 VT.getScalarType(), Ex, Sh));
4523 }
4524
4525 SDValue Result = DAG.getBuildVector(Node->getValueType(0), dl, Scalars);
4526 Results.push_back(Result);
4527 break;
4528 }
4531 case ISD::VECREDUCE_ADD:
4532 case ISD::VECREDUCE_MUL:
4533 case ISD::VECREDUCE_AND:
4534 case ISD::VECREDUCE_OR:
4535 case ISD::VECREDUCE_XOR:
4544 Results.push_back(TLI.expandVecReduce(Node, DAG));
4545 break;
4546 case ISD::VP_CTTZ_ELTS:
4547 case ISD::VP_CTTZ_ELTS_ZERO_UNDEF:
4548 Results.push_back(TLI.expandVPCTTZElements(Node, DAG));
4549 break;
4550 case ISD::CLEAR_CACHE:
4551 // The default expansion of llvm.clear_cache is simply a no-op for those
4552 // targets where it is not needed.
4553 Results.push_back(Node->getOperand(0));
4554 break;
4555 case ISD::LRINT:
4556 case ISD::LLRINT: {
4557 SDValue Arg = Node->getOperand(0);
4558 EVT ArgVT = Arg.getValueType();
4559 EVT ResVT = Node->getValueType(0);
4560 SDLoc dl(Node);
4561 SDValue RoundNode = DAG.getNode(ISD::FRINT, dl, ArgVT, Arg);
4562 Results.push_back(DAG.getNode(ISD::FP_TO_SINT, dl, ResVT, RoundNode));
4563 break;
4564 }
4565 case ISD::ADDRSPACECAST:
4566 Results.push_back(DAG.UnrollVectorOp(Node));
4567 break;
4569 case ISD::GlobalAddress:
4572 case ISD::ConstantPool:
4573 case ISD::JumpTable:
4577 // FIXME: Custom lowering for these operations shouldn't return null!
4578 // Return true so that we don't call ConvertNodeToLibcall which also won't
4579 // do anything.
4580 return true;
4581 }
4582
4583 if (!TLI.isStrictFPEnabled() && Results.empty() && Node->isStrictFPOpcode()) {
4584 // FIXME: We were asked to expand a strict floating-point operation,
4585 // but there is currently no expansion implemented that would preserve
4586 // the "strict" properties. For now, we just fall back to the non-strict
4587 // version if that is legal on the target. The actual mutation of the
4588 // operation will happen in SelectionDAGISel::DoInstructionSelection.
4589 switch (Node->getOpcode()) {
4590 default:
4591 if (TLI.getStrictFPOperationAction(Node->getOpcode(),
4592 Node->getValueType(0))
4593 == TargetLowering::Legal)
4594 return true;
4595 break;
4596 case ISD::STRICT_FSUB: {
4598 ISD::STRICT_FSUB, Node->getValueType(0)) == TargetLowering::Legal)
4599 return true;
4601 ISD::STRICT_FADD, Node->getValueType(0)) != TargetLowering::Legal)
4602 break;
4603
4604 EVT VT = Node->getValueType(0);
4605 const SDNodeFlags Flags = Node->getFlags();
4606 SDValue Neg = DAG.getNode(ISD::FNEG, dl, VT, Node->getOperand(2), Flags);
4607 SDValue Fadd = DAG.getNode(ISD::STRICT_FADD, dl, Node->getVTList(),
4608 {Node->getOperand(0), Node->getOperand(1), Neg},
4609 Flags);
4610
4611 Results.push_back(Fadd);
4612 Results.push_back(Fadd.getValue(1));
4613 break;
4614 }
4617 case ISD::STRICT_LRINT:
4618 case ISD::STRICT_LLRINT:
4619 case ISD::STRICT_LROUND:
4621 // These are registered by the operand type instead of the value
4622 // type. Reflect that here.
4623 if (TLI.getStrictFPOperationAction(Node->getOpcode(),
4624 Node->getOperand(1).getValueType())
4625 == TargetLowering::Legal)
4626 return true;
4627 break;
4628 }
4629 }
4630
4631 // Replace the original node with the legalized result.
4632 if (Results.empty()) {
4633 LLVM_DEBUG(dbgs() << "Cannot expand node\n");
4634 return false;
4635 }
4636
4637 LLVM_DEBUG(dbgs() << "Successfully expanded node\n");
4638 ReplaceNode(Node, Results.data());
4639 return true;
4640}
4641
4642/// Return if we can use the FAST_* variant of a math libcall for the node.
4643/// FIXME: This is just guessing, we probably should have unique specific sets
4644/// flags required per libcall.
4645static bool canUseFastMathLibcall(const SDNode *Node) {
4646 // FIXME: Probably should define fast to respect nan/inf and only be
4647 // approximate functions.
4648
4649 SDNodeFlags Flags = Node->getFlags();
4650 return Flags.hasApproximateFuncs() && Flags.hasNoNaNs() &&
4651 Flags.hasNoInfs() && Flags.hasNoSignedZeros();
4652}
4653
4654void SelectionDAGLegalize::ConvertNodeToLibcall(SDNode *Node) {
4655 LLVM_DEBUG(dbgs() << "Trying to convert node to libcall\n");
4657 SDLoc dl(Node);
4658 TargetLowering::MakeLibCallOptions CallOptions;
4659 CallOptions.IsPostTypeLegalization = true;
4660 // FIXME: Check flags on the node to see if we can use a finite call.
4661 unsigned Opc = Node->getOpcode();
4662 switch (Opc) {
4663 case ISD::ATOMIC_FENCE: {
4664 // If the target didn't lower this, lower it to '__sync_synchronize()' call
4665 // FIXME: handle "fence singlethread" more efficiently.
4666 TargetLowering::ArgListTy Args;
4667
4668 TargetLowering::CallLoweringInfo CLI(DAG);
4669 CLI.setDebugLoc(dl)
4670 .setChain(Node->getOperand(0))
4671 .setLibCallee(
4672 CallingConv::C, Type::getVoidTy(*DAG.getContext()),
4673 DAG.getExternalSymbol("__sync_synchronize",
4674 TLI.getPointerTy(DAG.getDataLayout())),
4675 std::move(Args));
4676
4677 std::pair<SDValue, SDValue> CallResult = TLI.LowerCallTo(CLI);
4678
4679 Results.push_back(CallResult.second);
4680 break;
4681 }
4682 // By default, atomic intrinsics are marked Legal and lowered. Targets
4683 // which don't support them directly, however, may want libcalls, in which
4684 // case they mark them Expand, and we get here.
4685 case ISD::ATOMIC_SWAP:
4697 case ISD::ATOMIC_CMP_SWAP: {
4698 MVT VT = cast<AtomicSDNode>(Node)->getMemoryVT().getSimpleVT();
4699 AtomicOrdering Order = cast<AtomicSDNode>(Node)->getMergedOrdering();
4700 RTLIB::Libcall LC = RTLIB::getOUTLINE_ATOMIC(Opc, Order, VT);
4701 EVT RetVT = Node->getValueType(0);
4703 if (TLI.getLibcallImpl(LC) != RTLIB::Unsupported) {
4704 // If outline atomic available, prepare its arguments and expand.
4705 Ops.append(Node->op_begin() + 2, Node->op_end());
4706 Ops.push_back(Node->getOperand(1));
4707
4708 } else {
4709 LC = RTLIB::getSYNC(Opc, VT);
4710 assert(LC != RTLIB::UNKNOWN_LIBCALL &&
4711 "Unexpected atomic op or value type!");
4712 // Arguments for expansion to sync libcall
4713 Ops.append(Node->op_begin() + 1, Node->op_end());
4714 }
4715 std::pair<SDValue, SDValue> Tmp = TLI.makeLibCall(DAG, LC, RetVT,
4716 Ops, CallOptions,
4717 SDLoc(Node),
4718 Node->getOperand(0));
4719 Results.push_back(Tmp.first);
4720 Results.push_back(Tmp.second);
4721 break;
4722 }
4723 case ISD::TRAP: {
4724 // If this operation is not supported, lower it to 'abort()' call
4725 TargetLowering::ArgListTy Args;
4726 TargetLowering::CallLoweringInfo CLI(DAG);
4727 CLI.setDebugLoc(dl)
4728 .setChain(Node->getOperand(0))
4729 .setLibCallee(CallingConv::C, Type::getVoidTy(*DAG.getContext()),
4731 "abort", TLI.getPointerTy(DAG.getDataLayout())),
4732 std::move(Args));
4733 std::pair<SDValue, SDValue> CallResult = TLI.LowerCallTo(CLI);
4734
4735 Results.push_back(CallResult.second);
4736 break;
4737 }
4738 case ISD::CLEAR_CACHE: {
4739 SDValue InputChain = Node->getOperand(0);
4740 SDValue StartVal = Node->getOperand(1);
4741 SDValue EndVal = Node->getOperand(2);
4742 std::pair<SDValue, SDValue> Tmp = TLI.makeLibCall(
4743 DAG, RTLIB::CLEAR_CACHE, MVT::isVoid, {StartVal, EndVal}, CallOptions,
4744 SDLoc(Node), InputChain);
4745 Results.push_back(Tmp.second);
4746 break;
4747 }
4748 case ISD::FMINNUM:
4750 ExpandFPLibCall(Node, RTLIB::FMIN_F32, RTLIB::FMIN_F64,
4751 RTLIB::FMIN_F80, RTLIB::FMIN_F128,
4752 RTLIB::FMIN_PPCF128, Results);
4753 break;
4754 // FIXME: We do not have libcalls for FMAXIMUM and FMINIMUM. So, we cannot use
4755 // libcall legalization for these nodes, but there is no default expasion for
4756 // these nodes either (see PR63267 for example).
4757 case ISD::FMAXNUM:
4759 ExpandFPLibCall(Node, RTLIB::FMAX_F32, RTLIB::FMAX_F64,
4760 RTLIB::FMAX_F80, RTLIB::FMAX_F128,
4761 RTLIB::FMAX_PPCF128, Results);
4762 break;
4763 case ISD::FMINIMUMNUM:
4764 ExpandFPLibCall(Node, RTLIB::FMINIMUM_NUM_F32, RTLIB::FMINIMUM_NUM_F64,
4765 RTLIB::FMINIMUM_NUM_F80, RTLIB::FMINIMUM_NUM_F128,
4766 RTLIB::FMINIMUM_NUM_PPCF128, Results);
4767 break;
4768 case ISD::FMAXIMUMNUM:
4769 ExpandFPLibCall(Node, RTLIB::FMAXIMUM_NUM_F32, RTLIB::FMAXIMUM_NUM_F64,
4770 RTLIB::FMAXIMUM_NUM_F80, RTLIB::FMAXIMUM_NUM_F128,
4771 RTLIB::FMAXIMUM_NUM_PPCF128, Results);
4772 break;
4773 case ISD::FSQRT:
4774 case ISD::STRICT_FSQRT: {
4775 // FIXME: Probably should define fast to respect nan/inf and only be
4776 // approximate functions.
4777 ExpandFastFPLibCall(Node, canUseFastMathLibcall(Node),
4778 {RTLIB::FAST_SQRT_F32, RTLIB::SQRT_F32},
4779 {RTLIB::FAST_SQRT_F64, RTLIB::SQRT_F64},
4780 {RTLIB::FAST_SQRT_F80, RTLIB::SQRT_F80},
4781 {RTLIB::FAST_SQRT_F128, RTLIB::SQRT_F128},
4782 {RTLIB::FAST_SQRT_PPCF128, RTLIB::SQRT_PPCF128},
4783 Results);
4784 break;
4785 }
4786 case ISD::FCBRT:
4787 ExpandFPLibCall(Node, RTLIB::CBRT_F32, RTLIB::CBRT_F64,
4788 RTLIB::CBRT_F80, RTLIB::CBRT_F128,
4789 RTLIB::CBRT_PPCF128, Results);
4790 break;
4791 case ISD::FSIN:
4792 case ISD::STRICT_FSIN:
4793 ExpandFPLibCall(Node, RTLIB::SIN_F32, RTLIB::SIN_F64,
4794 RTLIB::SIN_F80, RTLIB::SIN_F128,
4795 RTLIB::SIN_PPCF128, Results);
4796 break;
4797 case ISD::FCOS:
4798 case ISD::STRICT_FCOS:
4799 ExpandFPLibCall(Node, RTLIB::COS_F32, RTLIB::COS_F64,
4800 RTLIB::COS_F80, RTLIB::COS_F128,
4801 RTLIB::COS_PPCF128, Results);
4802 break;
4803 case ISD::FTAN:
4804 case ISD::STRICT_FTAN:
4805 ExpandFPLibCall(Node, RTLIB::TAN_F32, RTLIB::TAN_F64, RTLIB::TAN_F80,
4806 RTLIB::TAN_F128, RTLIB::TAN_PPCF128, Results);
4807 break;
4808 case ISD::FASIN:
4809 case ISD::STRICT_FASIN:
4810 ExpandFPLibCall(Node, RTLIB::ASIN_F32, RTLIB::ASIN_F64, RTLIB::ASIN_F80,
4811 RTLIB::ASIN_F128, RTLIB::ASIN_PPCF128, Results);
4812 break;
4813 case ISD::FACOS:
4814 case ISD::STRICT_FACOS:
4815 ExpandFPLibCall(Node, RTLIB::ACOS_F32, RTLIB::ACOS_F64, RTLIB::ACOS_F80,
4816 RTLIB::ACOS_F128, RTLIB::ACOS_PPCF128, Results);
4817 break;
4818 case ISD::FATAN:
4819 case ISD::STRICT_FATAN:
4820 ExpandFPLibCall(Node, RTLIB::ATAN_F32, RTLIB::ATAN_F64, RTLIB::ATAN_F80,
4821 RTLIB::ATAN_F128, RTLIB::ATAN_PPCF128, Results);
4822 break;
4823 case ISD::FATAN2:
4824 case ISD::STRICT_FATAN2:
4825 ExpandFPLibCall(Node, RTLIB::ATAN2_F32, RTLIB::ATAN2_F64, RTLIB::ATAN2_F80,
4826 RTLIB::ATAN2_F128, RTLIB::ATAN2_PPCF128, Results);
4827 break;
4828 case ISD::FSINH:
4829 case ISD::STRICT_FSINH:
4830 ExpandFPLibCall(Node, RTLIB::SINH_F32, RTLIB::SINH_F64, RTLIB::SINH_F80,
4831 RTLIB::SINH_F128, RTLIB::SINH_PPCF128, Results);
4832 break;
4833 case ISD::FCOSH:
4834 case ISD::STRICT_FCOSH:
4835 ExpandFPLibCall(Node, RTLIB::COSH_F32, RTLIB::COSH_F64, RTLIB::COSH_F80,
4836 RTLIB::COSH_F128, RTLIB::COSH_PPCF128, Results);
4837 break;
4838 case ISD::FTANH:
4839 case ISD::STRICT_FTANH:
4840 ExpandFPLibCall(Node, RTLIB::TANH_F32, RTLIB::TANH_F64, RTLIB::TANH_F80,
4841 RTLIB::TANH_F128, RTLIB::TANH_PPCF128, Results);
4842 break;
4843 case ISD::FSINCOS:
4844 case ISD::FSINCOSPI: {
4845 EVT VT = Node->getValueType(0);
4846
4847 if (Node->getOpcode() == ISD::FSINCOS) {
4848 RTLIB::Libcall SincosStret = RTLIB::getSINCOS_STRET(VT);
4849 if (SincosStret != RTLIB::UNKNOWN_LIBCALL) {
4850 if (SDValue Expanded = ExpandSincosStretLibCall(Node)) {
4851 Results.push_back(Expanded);
4852 Results.push_back(Expanded.getValue(1));
4853 break;
4854 }
4855 }
4856 }
4857
4858 RTLIB::Libcall LC = Node->getOpcode() == ISD::FSINCOS
4859 ? RTLIB::getSINCOS(VT)
4860 : RTLIB::getSINCOSPI(VT);
4861 bool Expanded = TLI.expandMultipleResultFPLibCall(DAG, LC, Node, Results);
4862 if (!Expanded) {
4863 DAG.getContext()->emitError(Twine("no libcall available for ") +
4864 Node->getOperationName(&DAG));
4865 SDValue Poison = DAG.getPOISON(VT);
4866 Results.push_back(Poison);
4867 Results.push_back(Poison);
4868 }
4869
4870 break;
4871 }
4872 case ISD::FLOG:
4873 case ISD::STRICT_FLOG:
4874 ExpandFPLibCall(Node, RTLIB::LOG_F32, RTLIB::LOG_F64, RTLIB::LOG_F80,
4875 RTLIB::LOG_F128, RTLIB::LOG_PPCF128, Results);
4876 break;
4877 case ISD::FLOG2:
4878 case ISD::STRICT_FLOG2:
4879 ExpandFPLibCall(Node, RTLIB::LOG2_F32, RTLIB::LOG2_F64, RTLIB::LOG2_F80,
4880 RTLIB::LOG2_F128, RTLIB::LOG2_PPCF128, Results);
4881 break;
4882 case ISD::FLOG10:
4883 case ISD::STRICT_FLOG10:
4884 ExpandFPLibCall(Node, RTLIB::LOG10_F32, RTLIB::LOG10_F64, RTLIB::LOG10_F80,
4885 RTLIB::LOG10_F128, RTLIB::LOG10_PPCF128, Results);
4886 break;
4887 case ISD::FEXP:
4888 case ISD::STRICT_FEXP:
4889 ExpandFPLibCall(Node, RTLIB::EXP_F32, RTLIB::EXP_F64, RTLIB::EXP_F80,
4890 RTLIB::EXP_F128, RTLIB::EXP_PPCF128, Results);
4891 break;
4892 case ISD::FEXP2:
4893 case ISD::STRICT_FEXP2:
4894 ExpandFPLibCall(Node, RTLIB::EXP2_F32, RTLIB::EXP2_F64, RTLIB::EXP2_F80,
4895 RTLIB::EXP2_F128, RTLIB::EXP2_PPCF128, Results);
4896 break;
4897 case ISD::FEXP10:
4898 ExpandFPLibCall(Node, RTLIB::EXP10_F32, RTLIB::EXP10_F64, RTLIB::EXP10_F80,
4899 RTLIB::EXP10_F128, RTLIB::EXP10_PPCF128, Results);
4900 break;
4901 case ISD::FTRUNC:
4902 case ISD::STRICT_FTRUNC:
4903 ExpandFPLibCall(Node, RTLIB::TRUNC_F32, RTLIB::TRUNC_F64,
4904 RTLIB::TRUNC_F80, RTLIB::TRUNC_F128,
4905 RTLIB::TRUNC_PPCF128, Results);
4906 break;
4907 case ISD::FFLOOR:
4908 case ISD::STRICT_FFLOOR:
4909 ExpandFPLibCall(Node, RTLIB::FLOOR_F32, RTLIB::FLOOR_F64,
4910 RTLIB::FLOOR_F80, RTLIB::FLOOR_F128,
4911 RTLIB::FLOOR_PPCF128, Results);
4912 break;
4913 case ISD::FCEIL:
4914 case ISD::STRICT_FCEIL:
4915 ExpandFPLibCall(Node, RTLIB::CEIL_F32, RTLIB::CEIL_F64,
4916 RTLIB::CEIL_F80, RTLIB::CEIL_F128,
4917 RTLIB::CEIL_PPCF128, Results);
4918 break;
4919 case ISD::FRINT:
4920 case ISD::STRICT_FRINT:
4921 ExpandFPLibCall(Node, RTLIB::RINT_F32, RTLIB::RINT_F64,
4922 RTLIB::RINT_F80, RTLIB::RINT_F128,
4923 RTLIB::RINT_PPCF128, Results);
4924 break;
4925 case ISD::FNEARBYINT:
4927 ExpandFPLibCall(Node, RTLIB::NEARBYINT_F32,
4928 RTLIB::NEARBYINT_F64,
4929 RTLIB::NEARBYINT_F80,
4930 RTLIB::NEARBYINT_F128,
4931 RTLIB::NEARBYINT_PPCF128, Results);
4932 break;
4933 case ISD::FROUND:
4934 case ISD::STRICT_FROUND:
4935 ExpandFPLibCall(Node, RTLIB::ROUND_F32,
4936 RTLIB::ROUND_F64,
4937 RTLIB::ROUND_F80,
4938 RTLIB::ROUND_F128,
4939 RTLIB::ROUND_PPCF128, Results);
4940 break;
4941 case ISD::FROUNDEVEN:
4943 ExpandFPLibCall(Node, RTLIB::ROUNDEVEN_F32,
4944 RTLIB::ROUNDEVEN_F64,
4945 RTLIB::ROUNDEVEN_F80,
4946 RTLIB::ROUNDEVEN_F128,
4947 RTLIB::ROUNDEVEN_PPCF128, Results);
4948 break;
4949 case ISD::FLDEXP:
4950 case ISD::STRICT_FLDEXP:
4951 ExpandFPLibCall(Node, RTLIB::LDEXP_F32, RTLIB::LDEXP_F64, RTLIB::LDEXP_F80,
4952 RTLIB::LDEXP_F128, RTLIB::LDEXP_PPCF128, Results);
4953 break;
4954 case ISD::FMODF:
4955 case ISD::FFREXP: {
4956 EVT VT = Node->getValueType(0);
4957 RTLIB::Libcall LC = Node->getOpcode() == ISD::FMODF ? RTLIB::getMODF(VT)
4958 : RTLIB::getFREXP(VT);
4959 bool Expanded = TLI.expandMultipleResultFPLibCall(DAG, LC, Node, Results,
4960 /*CallRetResNo=*/0);
4961 if (!Expanded)
4962 llvm_unreachable("Expected scalar FFREXP/FMODF to expand to libcall!");
4963 break;
4964 }
4965 case ISD::FPOWI:
4966 case ISD::STRICT_FPOWI: {
4967 RTLIB::Libcall LC = RTLIB::getPOWI(Node->getSimpleValueType(0));
4968 assert(LC != RTLIB::UNKNOWN_LIBCALL && "Unexpected fpowi.");
4969 if (TLI.getLibcallImpl(LC) == RTLIB::Unsupported) {
4970 // Some targets don't have a powi libcall; use pow instead.
4971 if (Node->isStrictFPOpcode()) {
4973 DAG.getNode(ISD::STRICT_SINT_TO_FP, SDLoc(Node),
4974 {Node->getValueType(0), Node->getValueType(1)},
4975 {Node->getOperand(0), Node->getOperand(2)});
4976 SDValue FPOW =
4977 DAG.getNode(ISD::STRICT_FPOW, SDLoc(Node),
4978 {Node->getValueType(0), Node->getValueType(1)},
4979 {Exponent.getValue(1), Node->getOperand(1), Exponent});
4980 Results.push_back(FPOW);
4981 Results.push_back(FPOW.getValue(1));
4982 } else {
4984 DAG.getNode(ISD::SINT_TO_FP, SDLoc(Node), Node->getValueType(0),
4985 Node->getOperand(1));
4986 Results.push_back(DAG.getNode(ISD::FPOW, SDLoc(Node),
4987 Node->getValueType(0),
4988 Node->getOperand(0), Exponent));
4989 }
4990 break;
4991 }
4992 unsigned Offset = Node->isStrictFPOpcode() ? 1 : 0;
4993 bool ExponentHasSizeOfInt =
4994 DAG.getLibInfo().getIntSize() ==
4995 Node->getOperand(1 + Offset).getValueType().getSizeInBits();
4996 if (!ExponentHasSizeOfInt) {
4997 // If the exponent does not match with sizeof(int) a libcall to
4998 // RTLIB::POWI would use the wrong type for the argument.
4999 DAG.getContext()->emitError("POWI exponent does not match sizeof(int)");
5000 Results.push_back(DAG.getPOISON(Node->getValueType(0)));
5001 break;
5002 }
5003 ExpandFPLibCall(Node, LC, Results);
5004 break;
5005 }
5006 case ISD::FPOW:
5007 case ISD::STRICT_FPOW:
5008 ExpandFPLibCall(Node, RTLIB::POW_F32, RTLIB::POW_F64, RTLIB::POW_F80,
5009 RTLIB::POW_F128, RTLIB::POW_PPCF128, Results);
5010 break;
5011 case ISD::LROUND:
5012 case ISD::STRICT_LROUND:
5013 ExpandArgFPLibCall(Node, RTLIB::LROUND_F32,
5014 RTLIB::LROUND_F64, RTLIB::LROUND_F80,
5015 RTLIB::LROUND_F128,
5016 RTLIB::LROUND_PPCF128, Results);
5017 break;
5018 case ISD::LLROUND:
5020 ExpandArgFPLibCall(Node, RTLIB::LLROUND_F32,
5021 RTLIB::LLROUND_F64, RTLIB::LLROUND_F80,
5022 RTLIB::LLROUND_F128,
5023 RTLIB::LLROUND_PPCF128, Results);
5024 break;
5025 case ISD::LRINT:
5026 case ISD::STRICT_LRINT:
5027 ExpandArgFPLibCall(Node, RTLIB::LRINT_F32,
5028 RTLIB::LRINT_F64, RTLIB::LRINT_F80,
5029 RTLIB::LRINT_F128,
5030 RTLIB::LRINT_PPCF128, Results);
5031 break;
5032 case ISD::LLRINT:
5033 case ISD::STRICT_LLRINT:
5034 ExpandArgFPLibCall(Node, RTLIB::LLRINT_F32,
5035 RTLIB::LLRINT_F64, RTLIB::LLRINT_F80,
5036 RTLIB::LLRINT_F128,
5037 RTLIB::LLRINT_PPCF128, Results);
5038 break;
5039 case ISD::FDIV:
5040 case ISD::STRICT_FDIV: {
5041 ExpandFastFPLibCall(Node, canUseFastMathLibcall(Node),
5042 {RTLIB::FAST_DIV_F32, RTLIB::DIV_F32},
5043 {RTLIB::FAST_DIV_F64, RTLIB::DIV_F64},
5044 {RTLIB::FAST_DIV_F80, RTLIB::DIV_F80},
5045 {RTLIB::FAST_DIV_F128, RTLIB::DIV_F128},
5046 {RTLIB::FAST_DIV_PPCF128, RTLIB::DIV_PPCF128}, Results);
5047 break;
5048 }
5049 case ISD::FREM:
5050 case ISD::STRICT_FREM:
5051 ExpandFPLibCall(Node, RTLIB::REM_F32, RTLIB::REM_F64,
5052 RTLIB::REM_F80, RTLIB::REM_F128,
5053 RTLIB::REM_PPCF128, Results);
5054 break;
5055 case ISD::FMA:
5056 case ISD::STRICT_FMA:
5057 ExpandFPLibCall(Node, RTLIB::FMA_F32, RTLIB::FMA_F64,
5058 RTLIB::FMA_F80, RTLIB::FMA_F128,
5059 RTLIB::FMA_PPCF128, Results);
5060 break;
5061 case ISD::FADD:
5062 case ISD::STRICT_FADD: {
5063 ExpandFastFPLibCall(Node, canUseFastMathLibcall(Node),
5064 {RTLIB::FAST_ADD_F32, RTLIB::ADD_F32},
5065 {RTLIB::FAST_ADD_F64, RTLIB::ADD_F64},
5066 {RTLIB::FAST_ADD_F80, RTLIB::ADD_F80},
5067 {RTLIB::FAST_ADD_F128, RTLIB::ADD_F128},
5068 {RTLIB::FAST_ADD_PPCF128, RTLIB::ADD_PPCF128}, Results);
5069 break;
5070 }
5071 case ISD::FMUL:
5072 case ISD::STRICT_FMUL: {
5073 ExpandFastFPLibCall(Node, canUseFastMathLibcall(Node),
5074 {RTLIB::FAST_MUL_F32, RTLIB::MUL_F32},
5075 {RTLIB::FAST_MUL_F64, RTLIB::MUL_F64},
5076 {RTLIB::FAST_MUL_F80, RTLIB::MUL_F80},
5077 {RTLIB::FAST_MUL_F128, RTLIB::MUL_F128},
5078 {RTLIB::FAST_MUL_PPCF128, RTLIB::MUL_PPCF128}, Results);
5079 break;
5080 }
5081 case ISD::FP16_TO_FP:
5082 if (Node->getValueType(0) == MVT::f32) {
5083 Results.push_back(ExpandLibCall(RTLIB::FPEXT_F16_F32, Node, false).first);
5084 }
5085 break;
5087 if (Node->getValueType(0) == MVT::f32) {
5088 std::pair<SDValue, SDValue> Tmp = TLI.makeLibCall(
5089 DAG, RTLIB::FPEXT_BF16_F32, MVT::f32, Node->getOperand(1),
5090 CallOptions, SDLoc(Node), Node->getOperand(0));
5091 Results.push_back(Tmp.first);
5092 Results.push_back(Tmp.second);
5093 }
5094 break;
5096 if (Node->getValueType(0) == MVT::f32) {
5097 std::pair<SDValue, SDValue> Tmp = TLI.makeLibCall(
5098 DAG, RTLIB::FPEXT_F16_F32, MVT::f32, Node->getOperand(1), CallOptions,
5099 SDLoc(Node), Node->getOperand(0));
5100 Results.push_back(Tmp.first);
5101 Results.push_back(Tmp.second);
5102 }
5103 break;
5104 }
5105 case ISD::FP_TO_FP16: {
5106 RTLIB::Libcall LC =
5107 RTLIB::getFPROUND(Node->getOperand(0).getValueType(), MVT::f16);
5108 assert(LC != RTLIB::UNKNOWN_LIBCALL && "Unable to expand fp_to_fp16");
5109 Results.push_back(ExpandLibCall(LC, Node, false).first);
5110 break;
5111 }
5112 case ISD::FP_TO_BF16: {
5113 RTLIB::Libcall LC =
5114 RTLIB::getFPROUND(Node->getOperand(0).getValueType(), MVT::bf16);
5115 assert(LC != RTLIB::UNKNOWN_LIBCALL && "Unable to expand fp_to_bf16");
5116 Results.push_back(ExpandLibCall(LC, Node, false).first);
5117 break;
5118 }
5121 case ISD::SINT_TO_FP:
5122 case ISD::UINT_TO_FP: {
5123 // TODO - Common the code with DAGTypeLegalizer::SoftenFloatRes_XINT_TO_FP
5124 bool IsStrict = Node->isStrictFPOpcode();
5125 bool Signed = Node->getOpcode() == ISD::SINT_TO_FP ||
5126 Node->getOpcode() == ISD::STRICT_SINT_TO_FP;
5127 EVT SVT = Node->getOperand(IsStrict ? 1 : 0).getValueType();
5128 EVT RVT = Node->getValueType(0);
5129 EVT NVT = EVT();
5130 SDLoc dl(Node);
5131
5132 // Even if the input is legal, no libcall may exactly match, eg. we don't
5133 // have i1 -> fp conversions. So, it needs to be promoted to a larger type,
5134 // eg: i13 -> fp. Then, look for an appropriate libcall.
5135 RTLIB::Libcall LC = RTLIB::UNKNOWN_LIBCALL;
5136 for (unsigned t = MVT::FIRST_INTEGER_VALUETYPE;
5137 t <= MVT::LAST_INTEGER_VALUETYPE && LC == RTLIB::UNKNOWN_LIBCALL;
5138 ++t) {
5139 NVT = (MVT::SimpleValueType)t;
5140 // The source needs to big enough to hold the operand.
5141 if (NVT.bitsGE(SVT))
5142 LC = Signed ? RTLIB::getSINTTOFP(NVT, RVT)
5143 : RTLIB::getUINTTOFP(NVT, RVT);
5144 }
5145 assert(LC != RTLIB::UNKNOWN_LIBCALL && "Unable to legalize as libcall");
5146
5147 SDValue Chain = IsStrict ? Node->getOperand(0) : SDValue();
5148 // Sign/zero extend the argument if the libcall takes a larger type.
5150 NVT, Node->getOperand(IsStrict ? 1 : 0));
5151 CallOptions.setIsSigned(Signed);
5152 std::pair<SDValue, SDValue> Tmp =
5153 TLI.makeLibCall(DAG, LC, RVT, Op, CallOptions, dl, Chain);
5154 Results.push_back(Tmp.first);
5155 if (IsStrict)
5156 Results.push_back(Tmp.second);
5157 break;
5158 }
5159 case ISD::FP_TO_SINT:
5160 case ISD::FP_TO_UINT:
5163 // TODO - Common the code with DAGTypeLegalizer::SoftenFloatOp_FP_TO_XINT.
5164 bool IsStrict = Node->isStrictFPOpcode();
5165 bool Signed = Node->getOpcode() == ISD::FP_TO_SINT ||
5166 Node->getOpcode() == ISD::STRICT_FP_TO_SINT;
5167
5168 SDValue Op = Node->getOperand(IsStrict ? 1 : 0);
5169 EVT SVT = Op.getValueType();
5170 EVT RVT = Node->getValueType(0);
5171 EVT NVT = EVT();
5172 SDLoc dl(Node);
5173
5174 // Even if the result is legal, no libcall may exactly match, eg. we don't
5175 // have fp -> i1 conversions. So, it needs to be promoted to a larger type,
5176 // eg: fp -> i32. Then, look for an appropriate libcall.
5177 RTLIB::Libcall LC = RTLIB::UNKNOWN_LIBCALL;
5178 for (unsigned IntVT = MVT::FIRST_INTEGER_VALUETYPE;
5179 IntVT <= MVT::LAST_INTEGER_VALUETYPE && LC == RTLIB::UNKNOWN_LIBCALL;
5180 ++IntVT) {
5181 NVT = (MVT::SimpleValueType)IntVT;
5182 // The type needs to big enough to hold the result.
5183 if (NVT.bitsGE(RVT))
5184 LC = Signed ? RTLIB::getFPTOSINT(SVT, NVT)
5185 : RTLIB::getFPTOUINT(SVT, NVT);
5186 }
5187 assert(LC != RTLIB::UNKNOWN_LIBCALL && "Unable to legalize as libcall");
5188
5189 SDValue Chain = IsStrict ? Node->getOperand(0) : SDValue();
5190 std::pair<SDValue, SDValue> Tmp =
5191 TLI.makeLibCall(DAG, LC, NVT, Op, CallOptions, dl, Chain);
5192
5193 // Truncate the result if the libcall returns a larger type.
5194 Results.push_back(DAG.getNode(ISD::TRUNCATE, dl, RVT, Tmp.first));
5195 if (IsStrict)
5196 Results.push_back(Tmp.second);
5197 break;
5198 }
5199
5200 case ISD::FP_ROUND:
5201 case ISD::STRICT_FP_ROUND: {
5202 // X = FP_ROUND(Y, TRUNC)
5203 // TRUNC is a flag, which is always an integer that is zero or one.
5204 // If TRUNC is 0, this is a normal rounding, if it is 1, this FP_ROUND
5205 // is known to not change the value of Y.
5206 // We can only expand it into libcall if the TRUNC is 0.
5207 bool IsStrict = Node->isStrictFPOpcode();
5208 SDValue Op = Node->getOperand(IsStrict ? 1 : 0);
5209 SDValue Chain = IsStrict ? Node->getOperand(0) : SDValue();
5210 EVT VT = Node->getValueType(0);
5211 assert(cast<ConstantSDNode>(Node->getOperand(IsStrict ? 2 : 1))->isZero() &&
5212 "Unable to expand as libcall if it is not normal rounding");
5213
5214 RTLIB::Libcall LC = RTLIB::getFPROUND(Op.getValueType(), VT);
5215 assert(LC != RTLIB::UNKNOWN_LIBCALL && "Unable to legalize as libcall");
5216
5217 std::pair<SDValue, SDValue> Tmp =
5218 TLI.makeLibCall(DAG, LC, VT, Op, CallOptions, SDLoc(Node), Chain);
5219 Results.push_back(Tmp.first);
5220 if (IsStrict)
5221 Results.push_back(Tmp.second);
5222 break;
5223 }
5224 case ISD::FP_EXTEND: {
5225 Results.push_back(
5226 ExpandLibCall(RTLIB::getFPEXT(Node->getOperand(0).getValueType(),
5227 Node->getValueType(0)),
5228 Node, false).first);
5229 break;
5230 }
5234 RTLIB::Libcall LC = RTLIB::UNKNOWN_LIBCALL;
5235 if (Node->getOpcode() == ISD::STRICT_FP_TO_FP16)
5236 LC = RTLIB::getFPROUND(Node->getOperand(1).getValueType(), MVT::f16);
5237 else if (Node->getOpcode() == ISD::STRICT_FP_TO_BF16)
5238 LC = RTLIB::getFPROUND(Node->getOperand(1).getValueType(), MVT::bf16);
5239 else
5240 LC = RTLIB::getFPEXT(Node->getOperand(1).getValueType(),
5241 Node->getValueType(0));
5242
5243 assert(LC != RTLIB::UNKNOWN_LIBCALL && "Unable to legalize as libcall");
5244
5245 std::pair<SDValue, SDValue> Tmp =
5246 TLI.makeLibCall(DAG, LC, Node->getValueType(0), Node->getOperand(1),
5247 CallOptions, SDLoc(Node), Node->getOperand(0));
5248 Results.push_back(Tmp.first);
5249 Results.push_back(Tmp.second);
5250 break;
5251 }
5252 case ISD::FSUB:
5253 case ISD::STRICT_FSUB: {
5254 ExpandFastFPLibCall(Node, canUseFastMathLibcall(Node),
5255 {RTLIB::FAST_SUB_F32, RTLIB::SUB_F32},
5256 {RTLIB::FAST_SUB_F64, RTLIB::SUB_F64},
5257 {RTLIB::FAST_SUB_F80, RTLIB::SUB_F80},
5258 {RTLIB::FAST_SUB_F128, RTLIB::SUB_F128},
5259 {RTLIB::FAST_SUB_PPCF128, RTLIB::SUB_PPCF128}, Results);
5260 break;
5261 }
5262 case ISD::SREM:
5263 Results.push_back(ExpandIntLibCall(Node, true,
5264 RTLIB::SREM_I8,
5265 RTLIB::SREM_I16, RTLIB::SREM_I32,
5266 RTLIB::SREM_I64, RTLIB::SREM_I128));
5267 break;
5268 case ISD::UREM:
5269 Results.push_back(ExpandIntLibCall(Node, false,
5270 RTLIB::UREM_I8,
5271 RTLIB::UREM_I16, RTLIB::UREM_I32,
5272 RTLIB::UREM_I64, RTLIB::UREM_I128));
5273 break;
5274 case ISD::SDIV:
5275 Results.push_back(ExpandIntLibCall(Node, true,
5276 RTLIB::SDIV_I8,
5277 RTLIB::SDIV_I16, RTLIB::SDIV_I32,
5278 RTLIB::SDIV_I64, RTLIB::SDIV_I128));
5279 break;
5280 case ISD::UDIV:
5281 Results.push_back(ExpandIntLibCall(Node, false,
5282 RTLIB::UDIV_I8,
5283 RTLIB::UDIV_I16, RTLIB::UDIV_I32,
5284 RTLIB::UDIV_I64, RTLIB::UDIV_I128));
5285 break;
5286 case ISD::SDIVREM:
5287 case ISD::UDIVREM:
5288 // Expand into divrem libcall
5289 ExpandDivRemLibCall(Node, Results);
5290 break;
5291 case ISD::MUL:
5292 Results.push_back(ExpandIntLibCall(Node, false,
5293 RTLIB::MUL_I8,
5294 RTLIB::MUL_I16, RTLIB::MUL_I32,
5295 RTLIB::MUL_I64, RTLIB::MUL_I128));
5296 break;
5298 Results.push_back(ExpandBitCountingLibCall(
5299 Node, RTLIB::CTLZ_I32, RTLIB::CTLZ_I64, RTLIB::CTLZ_I128));
5300 break;
5301 case ISD::CTPOP:
5302 Results.push_back(ExpandBitCountingLibCall(
5303 Node, RTLIB::CTPOP_I32, RTLIB::CTPOP_I64, RTLIB::CTPOP_I128));
5304 break;
5305 case ISD::RESET_FPENV: {
5306 // It is legalized to call 'fesetenv(FE_DFL_ENV)'. On most targets
5307 // FE_DFL_ENV is defined as '((const fenv_t *) -1)' in glibc.
5308 EVT PtrTy = TLI.getPointerTy(DAG.getDataLayout());
5309 SDValue Ptr = DAG.getAllOnesConstant(dl, PtrTy);
5310 SDValue Chain = Node->getOperand(0);
5311 Results.push_back(
5312 DAG.makeStateFunctionCall(RTLIB::FESETENV, Ptr, Chain, dl));
5313 break;
5314 }
5315 case ISD::GET_FPENV_MEM: {
5316 SDValue Chain = Node->getOperand(0);
5317 SDValue EnvPtr = Node->getOperand(1);
5318 Results.push_back(
5319 DAG.makeStateFunctionCall(RTLIB::FEGETENV, EnvPtr, Chain, dl));
5320 break;
5321 }
5322 case ISD::SET_FPENV_MEM: {
5323 SDValue Chain = Node->getOperand(0);
5324 SDValue EnvPtr = Node->getOperand(1);
5325 Results.push_back(
5326 DAG.makeStateFunctionCall(RTLIB::FESETENV, EnvPtr, Chain, dl));
5327 break;
5328 }
5329 case ISD::GET_FPMODE: {
5330 // Call fegetmode, which saves control modes into a stack slot. Then load
5331 // the value to return from the stack.
5332 EVT ModeVT = Node->getValueType(0);
5334 int SPFI = cast<FrameIndexSDNode>(StackPtr.getNode())->getIndex();
5335 SDValue Chain = DAG.makeStateFunctionCall(RTLIB::FEGETMODE, StackPtr,
5336 Node->getOperand(0), dl);
5337 SDValue LdInst = DAG.getLoad(
5338 ModeVT, dl, Chain, StackPtr,
5340 Results.push_back(LdInst);
5341 Results.push_back(LdInst.getValue(1));
5342 break;
5343 }
5344 case ISD::SET_FPMODE: {
5345 // Move control modes to stack slot and then call fesetmode with the pointer
5346 // to the slot as argument.
5347 SDValue Mode = Node->getOperand(1);
5348 EVT ModeVT = Mode.getValueType();
5350 int SPFI = cast<FrameIndexSDNode>(StackPtr.getNode())->getIndex();
5351 SDValue StInst = DAG.getStore(
5352 Node->getOperand(0), dl, Mode, StackPtr,
5354 Results.push_back(
5355 DAG.makeStateFunctionCall(RTLIB::FESETMODE, StackPtr, StInst, dl));
5356 break;
5357 }
5358 case ISD::RESET_FPMODE: {
5359 // It is legalized to a call 'fesetmode(FE_DFL_MODE)'. On most targets
5360 // FE_DFL_MODE is defined as '((const femode_t *) -1)' in glibc. If not, the
5361 // target must provide custom lowering.
5362 const DataLayout &DL = DAG.getDataLayout();
5363 EVT PtrTy = TLI.getPointerTy(DL);
5364 SDValue Mode = DAG.getAllOnesConstant(dl, PtrTy);
5365 Results.push_back(DAG.makeStateFunctionCall(RTLIB::FESETMODE, Mode,
5366 Node->getOperand(0), dl));
5367 break;
5368 }
5369 }
5370
5371 // Replace the original node with the legalized result.
5372 if (!Results.empty()) {
5373 LLVM_DEBUG(dbgs() << "Successfully converted node to libcall\n");
5374 ReplaceNode(Node, Results.data());
5375 } else
5376 LLVM_DEBUG(dbgs() << "Could not convert node to libcall\n");
5377}
5378
5379// Determine the vector type to use in place of an original scalar element when
5380// promoting equally sized vectors.
5382 MVT EltVT, MVT NewEltVT) {
5383 unsigned OldEltsPerNewElt = EltVT.getSizeInBits() / NewEltVT.getSizeInBits();
5384 MVT MidVT = OldEltsPerNewElt == 1
5385 ? NewEltVT
5386 : MVT::getVectorVT(NewEltVT, OldEltsPerNewElt);
5387 assert(TLI.isTypeLegal(MidVT) && "unexpected");
5388 return MidVT;
5389}
5390
5391void SelectionDAGLegalize::PromoteNode(SDNode *Node) {
5392 LLVM_DEBUG(dbgs() << "Trying to promote node\n");
5394 MVT OVT = Node->getSimpleValueType(0);
5395 if (Node->getOpcode() == ISD::UINT_TO_FP ||
5396 Node->getOpcode() == ISD::SINT_TO_FP ||
5397 Node->getOpcode() == ISD::SETCC ||
5398 Node->getOpcode() == ISD::EXTRACT_VECTOR_ELT ||
5399 Node->getOpcode() == ISD::INSERT_VECTOR_ELT ||
5400 Node->getOpcode() == ISD::VECREDUCE_FMAX ||
5401 Node->getOpcode() == ISD::VECREDUCE_FMIN ||
5402 Node->getOpcode() == ISD::VECREDUCE_FMAXIMUM ||
5403 Node->getOpcode() == ISD::VECREDUCE_FMINIMUM) {
5404 OVT = Node->getOperand(0).getSimpleValueType();
5405 }
5406 if (Node->getOpcode() == ISD::ATOMIC_STORE ||
5407 Node->getOpcode() == ISD::STRICT_UINT_TO_FP ||
5408 Node->getOpcode() == ISD::STRICT_SINT_TO_FP ||
5409 Node->getOpcode() == ISD::STRICT_FSETCC ||
5410 Node->getOpcode() == ISD::STRICT_FSETCCS ||
5411 Node->getOpcode() == ISD::VP_REDUCE_FADD ||
5412 Node->getOpcode() == ISD::VP_REDUCE_FMUL ||
5413 Node->getOpcode() == ISD::VP_REDUCE_FMAX ||
5414 Node->getOpcode() == ISD::VP_REDUCE_FMIN ||
5415 Node->getOpcode() == ISD::VP_REDUCE_FMAXIMUM ||
5416 Node->getOpcode() == ISD::VP_REDUCE_FMINIMUM ||
5417 Node->getOpcode() == ISD::VP_REDUCE_SEQ_FADD)
5418 OVT = Node->getOperand(1).getSimpleValueType();
5419 if (Node->getOpcode() == ISD::BR_CC ||
5420 Node->getOpcode() == ISD::SELECT_CC)
5421 OVT = Node->getOperand(2).getSimpleValueType();
5422 // Preserve fast math flags
5423 SDNodeFlags FastMathFlags = Node->getFlags() & SDNodeFlags::FastMathFlags;
5424 SelectionDAG::FlagInserter FlagsInserter(DAG, FastMathFlags);
5425 MVT NVT = TLI.getTypeToPromoteTo(Node->getOpcode(), OVT);
5426 SDLoc dl(Node);
5427 SDValue Tmp1, Tmp2, Tmp3, Tmp4;
5428 switch (Node->getOpcode()) {
5429 case ISD::CTTZ:
5431 case ISD::CTLZ:
5432 case ISD::CTPOP: {
5433 // Zero extend the argument unless its cttz, then use any_extend.
5434 if (Node->getOpcode() == ISD::CTTZ ||
5435 Node->getOpcode() == ISD::CTTZ_ZERO_UNDEF)
5436 Tmp1 = DAG.getNode(ISD::ANY_EXTEND, dl, NVT, Node->getOperand(0));
5437 else
5438 Tmp1 = DAG.getNode(ISD::ZERO_EXTEND, dl, NVT, Node->getOperand(0));
5439
5440 unsigned NewOpc = Node->getOpcode();
5441 if (NewOpc == ISD::CTTZ) {
5442 // The count is the same in the promoted type except if the original
5443 // value was zero. This can be handled by setting the bit just off
5444 // the top of the original type.
5445 auto TopBit = APInt::getOneBitSet(NVT.getSizeInBits(),
5446 OVT.getSizeInBits());
5447 Tmp1 = DAG.getNode(ISD::OR, dl, NVT, Tmp1,
5448 DAG.getConstant(TopBit, dl, NVT));
5449 NewOpc = ISD::CTTZ_ZERO_UNDEF;
5450 }
5451 // Perform the larger operation. For CTPOP and CTTZ_ZERO_UNDEF, this is
5452 // already the correct result.
5453 Tmp1 = DAG.getNode(NewOpc, dl, NVT, Tmp1);
5454 if (NewOpc == ISD::CTLZ) {
5455 // Tmp1 = Tmp1 - (sizeinbits(NVT) - sizeinbits(Old VT))
5456 Tmp1 = DAG.getNode(ISD::SUB, dl, NVT, Tmp1,
5457 DAG.getConstant(NVT.getSizeInBits() -
5458 OVT.getSizeInBits(), dl, NVT));
5459 }
5460 Results.push_back(
5461 DAG.getNode(ISD::TRUNCATE, dl, OVT, Tmp1, SDNodeFlags::NoWrap));
5462 break;
5463 }
5464 case ISD::CTLZ_ZERO_UNDEF: {
5465 // We know that the argument is unlikely to be zero, hence we can take a
5466 // different approach as compared to ISD::CTLZ
5467
5468 // Any Extend the argument
5469 auto AnyExtendedNode =
5470 DAG.getNode(ISD::ANY_EXTEND, dl, NVT, Node->getOperand(0));
5471
5472 // Tmp1 = Tmp1 << (sizeinbits(NVT) - sizeinbits(Old VT))
5473 auto ShiftConstant = DAG.getShiftAmountConstant(
5474 NVT.getSizeInBits() - OVT.getSizeInBits(), NVT, dl);
5475 auto LeftShiftResult =
5476 DAG.getNode(ISD::SHL, dl, NVT, AnyExtendedNode, ShiftConstant);
5477
5478 // Perform the larger operation
5479 auto CTLZResult = DAG.getNode(Node->getOpcode(), dl, NVT, LeftShiftResult);
5480 Results.push_back(DAG.getNode(ISD::TRUNCATE, dl, OVT, CTLZResult));
5481 break;
5482 }
5483 case ISD::BITREVERSE:
5484 case ISD::BSWAP: {
5485 unsigned DiffBits = NVT.getSizeInBits() - OVT.getSizeInBits();
5486 Tmp1 = DAG.getNode(ISD::ZERO_EXTEND, dl, NVT, Node->getOperand(0));
5487 Tmp1 = DAG.getNode(Node->getOpcode(), dl, NVT, Tmp1);
5488 Tmp1 = DAG.getNode(ISD::SRL, dl, NVT, Tmp1,
5489 DAG.getShiftAmountConstant(DiffBits, NVT, dl));
5490
5491 Results.push_back(DAG.getNode(ISD::TRUNCATE, dl, OVT, Tmp1));
5492 break;
5493 }
5494 case ISD::FP_TO_UINT:
5496 case ISD::FP_TO_SINT:
5498 PromoteLegalFP_TO_INT(Node, dl, Results);
5499 break;
5502 Results.push_back(PromoteLegalFP_TO_INT_SAT(Node, dl));
5503 break;
5504 case ISD::UINT_TO_FP:
5506 case ISD::SINT_TO_FP:
5508 PromoteLegalINT_TO_FP(Node, dl, Results);
5509 break;
5510 case ISD::VAARG: {
5511 SDValue Chain = Node->getOperand(0); // Get the chain.
5512 SDValue Ptr = Node->getOperand(1); // Get the pointer.
5513
5514 unsigned TruncOp;
5515 if (OVT.isVector()) {
5516 TruncOp = ISD::BITCAST;
5517 } else {
5518 assert(OVT.isInteger()
5519 && "VAARG promotion is supported only for vectors or integer types");
5520 TruncOp = ISD::TRUNCATE;
5521 }
5522
5523 // Perform the larger operation, then convert back
5524 Tmp1 = DAG.getVAArg(NVT, dl, Chain, Ptr, Node->getOperand(2),
5525 Node->getConstantOperandVal(3));
5526 Chain = Tmp1.getValue(1);
5527
5528 Tmp2 = DAG.getNode(TruncOp, dl, OVT, Tmp1);
5529
5530 // Modified the chain result - switch anything that used the old chain to
5531 // use the new one.
5532 DAG.ReplaceAllUsesOfValueWith(SDValue(Node, 0), Tmp2);
5533 DAG.ReplaceAllUsesOfValueWith(SDValue(Node, 1), Chain);
5534 if (UpdatedNodes) {
5535 UpdatedNodes->insert(Tmp2.getNode());
5536 UpdatedNodes->insert(Chain.getNode());
5537 }
5538 ReplacedNode(Node);
5539 break;
5540 }
5541 case ISD::MUL:
5542 case ISD::SDIV:
5543 case ISD::SREM:
5544 case ISD::UDIV:
5545 case ISD::UREM:
5546 case ISD::SMIN:
5547 case ISD::SMAX:
5548 case ISD::UMIN:
5549 case ISD::UMAX:
5550 case ISD::AND:
5551 case ISD::OR:
5552 case ISD::XOR: {
5553 unsigned ExtOp, TruncOp;
5554 if (OVT.isVector()) {
5555 ExtOp = ISD::BITCAST;
5556 TruncOp = ISD::BITCAST;
5557 } else {
5558 assert(OVT.isInteger() && "Cannot promote logic operation");
5559
5560 switch (Node->getOpcode()) {
5561 default:
5562 ExtOp = ISD::ANY_EXTEND;
5563 break;
5564 case ISD::SDIV:
5565 case ISD::SREM:
5566 case ISD::SMIN:
5567 case ISD::SMAX:
5568 ExtOp = ISD::SIGN_EXTEND;
5569 break;
5570 case ISD::UDIV:
5571 case ISD::UREM:
5572 ExtOp = ISD::ZERO_EXTEND;
5573 break;
5574 case ISD::UMIN:
5575 case ISD::UMAX:
5576 if (TLI.isSExtCheaperThanZExt(OVT, NVT))
5577 ExtOp = ISD::SIGN_EXTEND;
5578 else
5579 ExtOp = ISD::ZERO_EXTEND;
5580 break;
5581 }
5582 TruncOp = ISD::TRUNCATE;
5583 }
5584 // Promote each of the values to the new type.
5585 Tmp1 = DAG.getNode(ExtOp, dl, NVT, Node->getOperand(0));
5586 Tmp2 = DAG.getNode(ExtOp, dl, NVT, Node->getOperand(1));
5587 // Perform the larger operation, then convert back
5588 Tmp1 = DAG.getNode(Node->getOpcode(), dl, NVT, Tmp1, Tmp2);
5589 Results.push_back(DAG.getNode(TruncOp, dl, OVT, Tmp1));
5590 break;
5591 }
5592 case ISD::UMUL_LOHI:
5593 case ISD::SMUL_LOHI: {
5594 // Promote to a multiply in a wider integer type.
5595 unsigned ExtOp = Node->getOpcode() == ISD::UMUL_LOHI ? ISD::ZERO_EXTEND
5597 Tmp1 = DAG.getNode(ExtOp, dl, NVT, Node->getOperand(0));
5598 Tmp2 = DAG.getNode(ExtOp, dl, NVT, Node->getOperand(1));
5599 Tmp1 = DAG.getNode(ISD::MUL, dl, NVT, Tmp1, Tmp2);
5600
5601 unsigned OriginalSize = OVT.getScalarSizeInBits();
5602 Tmp2 = DAG.getNode(ISD::SRL, dl, NVT, Tmp1,
5603 DAG.getShiftAmountConstant(OriginalSize, NVT, dl));
5604 Results.push_back(DAG.getNode(ISD::TRUNCATE, dl, OVT, Tmp1));
5605 Results.push_back(DAG.getNode(ISD::TRUNCATE, dl, OVT, Tmp2));
5606 break;
5607 }
5608 case ISD::SELECT: {
5609 unsigned ExtOp, TruncOp;
5610 if (Node->getValueType(0).isVector() ||
5611 Node->getValueType(0).getSizeInBits() == NVT.getSizeInBits()) {
5612 ExtOp = ISD::BITCAST;
5613 TruncOp = ISD::BITCAST;
5614 } else if (Node->getValueType(0).isInteger()) {
5615 ExtOp = ISD::ANY_EXTEND;
5616 TruncOp = ISD::TRUNCATE;
5617 } else {
5618 ExtOp = ISD::FP_EXTEND;
5619 TruncOp = ISD::FP_ROUND;
5620 }
5621 Tmp1 = Node->getOperand(0);
5622 // Promote each of the values to the new type.
5623 Tmp2 = DAG.getNode(ExtOp, dl, NVT, Node->getOperand(1));
5624 Tmp3 = DAG.getNode(ExtOp, dl, NVT, Node->getOperand(2));
5625 // Perform the larger operation, then round down.
5626 Tmp1 = DAG.getSelect(dl, NVT, Tmp1, Tmp2, Tmp3);
5627 if (TruncOp != ISD::FP_ROUND)
5628 Tmp1 = DAG.getNode(TruncOp, dl, Node->getValueType(0), Tmp1);
5629 else
5630 Tmp1 = DAG.getNode(TruncOp, dl, Node->getValueType(0), Tmp1,
5631 DAG.getIntPtrConstant(0, dl, /*isTarget=*/true));
5632 Results.push_back(Tmp1);
5633 break;
5634 }
5635 case ISD::VECTOR_SHUFFLE: {
5636 ArrayRef<int> Mask = cast<ShuffleVectorSDNode>(Node)->getMask();
5637
5638 // Cast the two input vectors.
5639 Tmp1 = DAG.getNode(ISD::BITCAST, dl, NVT, Node->getOperand(0));
5640 Tmp2 = DAG.getNode(ISD::BITCAST, dl, NVT, Node->getOperand(1));
5641
5642 // Convert the shuffle mask to the right # elements.
5643 Tmp1 = ShuffleWithNarrowerEltType(NVT, OVT, dl, Tmp1, Tmp2, Mask);
5644 Tmp1 = DAG.getNode(ISD::BITCAST, dl, OVT, Tmp1);
5645 Results.push_back(Tmp1);
5646 break;
5647 }
5648 case ISD::VECTOR_SPLICE: {
5649 Tmp1 = DAG.getNode(ISD::ANY_EXTEND, dl, NVT, Node->getOperand(0));
5650 Tmp2 = DAG.getNode(ISD::ANY_EXTEND, dl, NVT, Node->getOperand(1));
5651 Tmp3 = DAG.getNode(ISD::VECTOR_SPLICE, dl, NVT, Tmp1, Tmp2,
5652 Node->getOperand(2));
5653 Results.push_back(DAG.getNode(ISD::TRUNCATE, dl, OVT, Tmp3));
5654 break;
5655 }
5656 case ISD::SELECT_CC: {
5657 SDValue Cond = Node->getOperand(4);
5658 ISD::CondCode CCCode = cast<CondCodeSDNode>(Cond)->get();
5659 // Type of the comparison operands.
5660 MVT CVT = Node->getSimpleValueType(0);
5661 assert(CVT == OVT && "not handled");
5662
5663 unsigned ExtOp = ISD::FP_EXTEND;
5664 if (NVT.isInteger()) {
5666 }
5667
5668 // Promote the comparison operands, if needed.
5669 if (TLI.isCondCodeLegal(CCCode, CVT)) {
5670 Tmp1 = Node->getOperand(0);
5671 Tmp2 = Node->getOperand(1);
5672 } else {
5673 Tmp1 = DAG.getNode(ExtOp, dl, NVT, Node->getOperand(0));
5674 Tmp2 = DAG.getNode(ExtOp, dl, NVT, Node->getOperand(1));
5675 }
5676 // Cast the true/false operands.
5677 Tmp3 = DAG.getNode(ExtOp, dl, NVT, Node->getOperand(2));
5678 Tmp4 = DAG.getNode(ExtOp, dl, NVT, Node->getOperand(3));
5679
5680 Tmp1 = DAG.getNode(ISD::SELECT_CC, dl, NVT, {Tmp1, Tmp2, Tmp3, Tmp4, Cond},
5681 Node->getFlags());
5682
5683 // Cast the result back to the original type.
5684 if (ExtOp != ISD::FP_EXTEND)
5685 Tmp1 = DAG.getNode(ISD::TRUNCATE, dl, OVT, Tmp1);
5686 else
5687 Tmp1 = DAG.getNode(ISD::FP_ROUND, dl, OVT, Tmp1,
5688 DAG.getIntPtrConstant(0, dl, /*isTarget=*/true));
5689
5690 Results.push_back(Tmp1);
5691 break;
5692 }
5693 case ISD::SETCC:
5694 case ISD::STRICT_FSETCC:
5695 case ISD::STRICT_FSETCCS: {
5696 unsigned ExtOp = ISD::FP_EXTEND;
5697 if (NVT.isInteger()) {
5698 ISD::CondCode CCCode = cast<CondCodeSDNode>(Node->getOperand(2))->get();
5699 if (isSignedIntSetCC(CCCode) ||
5700 TLI.isSExtCheaperThanZExt(Node->getOperand(0).getValueType(), NVT))
5701 ExtOp = ISD::SIGN_EXTEND;
5702 else
5703 ExtOp = ISD::ZERO_EXTEND;
5704 }
5705 if (Node->isStrictFPOpcode()) {
5706 SDValue InChain = Node->getOperand(0);
5707 std::tie(Tmp1, std::ignore) =
5708 DAG.getStrictFPExtendOrRound(Node->getOperand(1), InChain, dl, NVT);
5709 std::tie(Tmp2, std::ignore) =
5710 DAG.getStrictFPExtendOrRound(Node->getOperand(2), InChain, dl, NVT);
5711 SmallVector<SDValue, 2> TmpChains = {Tmp1.getValue(1), Tmp2.getValue(1)};
5712 SDValue OutChain = DAG.getTokenFactor(dl, TmpChains);
5713 SDVTList VTs = DAG.getVTList(Node->getValueType(0), MVT::Other);
5714 Results.push_back(DAG.getNode(Node->getOpcode(), dl, VTs,
5715 {OutChain, Tmp1, Tmp2, Node->getOperand(3)},
5716 Node->getFlags()));
5717 Results.push_back(Results.back().getValue(1));
5718 break;
5719 }
5720 Tmp1 = DAG.getNode(ExtOp, dl, NVT, Node->getOperand(0));
5721 Tmp2 = DAG.getNode(ExtOp, dl, NVT, Node->getOperand(1));
5722 Results.push_back(DAG.getNode(ISD::SETCC, dl, Node->getValueType(0), Tmp1,
5723 Tmp2, Node->getOperand(2), Node->getFlags()));
5724 break;
5725 }
5726 case ISD::BR_CC: {
5727 unsigned ExtOp = ISD::FP_EXTEND;
5728 if (NVT.isInteger()) {
5729 ISD::CondCode CCCode =
5730 cast<CondCodeSDNode>(Node->getOperand(1))->get();
5732 }
5733 Tmp1 = DAG.getNode(ExtOp, dl, NVT, Node->getOperand(2));
5734 Tmp2 = DAG.getNode(ExtOp, dl, NVT, Node->getOperand(3));
5735 Results.push_back(DAG.getNode(ISD::BR_CC, dl, Node->getValueType(0),
5736 Node->getOperand(0), Node->getOperand(1),
5737 Tmp1, Tmp2, Node->getOperand(4)));
5738 break;
5739 }
5740 case ISD::FADD:
5741 case ISD::FSUB:
5742 case ISD::FMUL:
5743 case ISD::FDIV:
5744 case ISD::FREM:
5745 case ISD::FMINNUM:
5746 case ISD::FMAXNUM:
5747 case ISD::FMINIMUM:
5748 case ISD::FMAXIMUM:
5749 case ISD::FMINIMUMNUM:
5750 case ISD::FMAXIMUMNUM:
5751 case ISD::FPOW:
5752 case ISD::FATAN2:
5753 Tmp1 = DAG.getNode(ISD::FP_EXTEND, dl, NVT, Node->getOperand(0));
5754 Tmp2 = DAG.getNode(ISD::FP_EXTEND, dl, NVT, Node->getOperand(1));
5755 Tmp3 = DAG.getNode(Node->getOpcode(), dl, NVT, Tmp1, Tmp2);
5756 Results.push_back(
5757 DAG.getNode(ISD::FP_ROUND, dl, OVT, Tmp3,
5758 DAG.getIntPtrConstant(0, dl, /*isTarget=*/true)));
5759 break;
5760
5762 case ISD::STRICT_FMAXIMUM: {
5763 SDValue InChain = Node->getOperand(0);
5764 SDVTList VTs = DAG.getVTList(NVT, MVT::Other);
5765 Tmp1 = DAG.getNode(ISD::STRICT_FP_EXTEND, dl, VTs, InChain,
5766 Node->getOperand(1));
5767 Tmp2 = DAG.getNode(ISD::STRICT_FP_EXTEND, dl, VTs, InChain,
5768 Node->getOperand(2));
5769 SmallVector<SDValue, 4> Ops = {InChain, Tmp1, Tmp2};
5770 Tmp3 = DAG.getNode(Node->getOpcode(), dl, VTs, Ops, Node->getFlags());
5771 Tmp4 = DAG.getNode(ISD::STRICT_FP_ROUND, dl, DAG.getVTList(OVT, MVT::Other),
5772 InChain, Tmp3,
5773 DAG.getIntPtrConstant(0, dl, /*isTarget=*/true));
5774 Results.push_back(Tmp4);
5775 Results.push_back(Tmp4.getValue(1));
5776 break;
5777 }
5778
5779 case ISD::STRICT_FADD:
5780 case ISD::STRICT_FSUB:
5781 case ISD::STRICT_FMUL:
5782 case ISD::STRICT_FDIV:
5785 case ISD::STRICT_FREM:
5786 case ISD::STRICT_FPOW:
5787 case ISD::STRICT_FATAN2:
5788 Tmp1 = DAG.getNode(ISD::STRICT_FP_EXTEND, dl, {NVT, MVT::Other},
5789 {Node->getOperand(0), Node->getOperand(1)});
5790 Tmp2 = DAG.getNode(ISD::STRICT_FP_EXTEND, dl, {NVT, MVT::Other},
5791 {Node->getOperand(0), Node->getOperand(2)});
5792 Tmp3 = DAG.getNode(ISD::TokenFactor, dl, MVT::Other, Tmp1.getValue(1),
5793 Tmp2.getValue(1));
5794 Tmp1 = DAG.getNode(Node->getOpcode(), dl, {NVT, MVT::Other},
5795 {Tmp3, Tmp1, Tmp2});
5796 Tmp1 = DAG.getNode(ISD::STRICT_FP_ROUND, dl, {OVT, MVT::Other},
5797 {Tmp1.getValue(1), Tmp1,
5798 DAG.getIntPtrConstant(0, dl, /*isTarget=*/true)});
5799 Results.push_back(Tmp1);
5800 Results.push_back(Tmp1.getValue(1));
5801 break;
5802 case ISD::FMA:
5803 Tmp1 = DAG.getNode(ISD::FP_EXTEND, dl, NVT, Node->getOperand(0));
5804 Tmp2 = DAG.getNode(ISD::FP_EXTEND, dl, NVT, Node->getOperand(1));
5805 Tmp3 = DAG.getNode(ISD::FP_EXTEND, dl, NVT, Node->getOperand(2));
5806 Results.push_back(
5807 DAG.getNode(ISD::FP_ROUND, dl, OVT,
5808 DAG.getNode(Node->getOpcode(), dl, NVT, Tmp1, Tmp2, Tmp3),
5809 DAG.getIntPtrConstant(0, dl, /*isTarget=*/true)));
5810 break;
5811 case ISD::STRICT_FMA:
5812 Tmp1 = DAG.getNode(ISD::STRICT_FP_EXTEND, dl, {NVT, MVT::Other},
5813 {Node->getOperand(0), Node->getOperand(1)});
5814 Tmp2 = DAG.getNode(ISD::STRICT_FP_EXTEND, dl, {NVT, MVT::Other},
5815 {Node->getOperand(0), Node->getOperand(2)});
5816 Tmp3 = DAG.getNode(ISD::STRICT_FP_EXTEND, dl, {NVT, MVT::Other},
5817 {Node->getOperand(0), Node->getOperand(3)});
5818 Tmp4 = DAG.getNode(ISD::TokenFactor, dl, MVT::Other, Tmp1.getValue(1),
5819 Tmp2.getValue(1), Tmp3.getValue(1));
5820 Tmp4 = DAG.getNode(Node->getOpcode(), dl, {NVT, MVT::Other},
5821 {Tmp4, Tmp1, Tmp2, Tmp3});
5822 Tmp4 = DAG.getNode(ISD::STRICT_FP_ROUND, dl, {OVT, MVT::Other},
5823 {Tmp4.getValue(1), Tmp4,
5824 DAG.getIntPtrConstant(0, dl, /*isTarget=*/true)});
5825 Results.push_back(Tmp4);
5826 Results.push_back(Tmp4.getValue(1));
5827 break;
5828 case ISD::FCOPYSIGN:
5829 case ISD::FLDEXP:
5830 case ISD::FPOWI: {
5831 Tmp1 = DAG.getNode(ISD::FP_EXTEND, dl, NVT, Node->getOperand(0));
5832 Tmp2 = Node->getOperand(1);
5833 Tmp3 = DAG.getNode(Node->getOpcode(), dl, NVT, Tmp1, Tmp2);
5834
5835 // fcopysign doesn't change anything but the sign bit, so
5836 // (fp_round (fcopysign (fpext a), b))
5837 // is as precise as
5838 // (fp_round (fpext a))
5839 // which is a no-op. Mark it as a TRUNCating FP_ROUND.
5840 const bool isTrunc = (Node->getOpcode() == ISD::FCOPYSIGN);
5841 Results.push_back(
5842 DAG.getNode(ISD::FP_ROUND, dl, OVT, Tmp3,
5843 DAG.getIntPtrConstant(isTrunc, dl, /*isTarget=*/true)));
5844 break;
5845 }
5846 case ISD::STRICT_FLDEXP: {
5847 Tmp1 = DAG.getNode(ISD::STRICT_FP_EXTEND, dl, {NVT, MVT::Other},
5848 {Node->getOperand(0), Node->getOperand(1)});
5849 Tmp2 = Node->getOperand(2);
5850 Tmp3 = DAG.getNode(ISD::STRICT_FLDEXP, dl, {NVT, MVT::Other},
5851 {Tmp1.getValue(1), Tmp1, Tmp2});
5852 Tmp4 = DAG.getNode(ISD::STRICT_FP_ROUND, dl, {OVT, MVT::Other},
5853 {Tmp3.getValue(1), Tmp3,
5854 DAG.getIntPtrConstant(0, dl, /*isTarget=*/true)});
5855 Results.push_back(Tmp4);
5856 Results.push_back(Tmp4.getValue(1));
5857 break;
5858 }
5859 case ISD::STRICT_FPOWI:
5860 Tmp1 = DAG.getNode(ISD::STRICT_FP_EXTEND, dl, {NVT, MVT::Other},
5861 {Node->getOperand(0), Node->getOperand(1)});
5862 Tmp2 = DAG.getNode(Node->getOpcode(), dl, {NVT, MVT::Other},
5863 {Tmp1.getValue(1), Tmp1, Node->getOperand(2)});
5864 Tmp3 = DAG.getNode(ISD::STRICT_FP_ROUND, dl, {OVT, MVT::Other},
5865 {Tmp2.getValue(1), Tmp2,
5866 DAG.getIntPtrConstant(0, dl, /*isTarget=*/true)});
5867 Results.push_back(Tmp3);
5868 Results.push_back(Tmp3.getValue(1));
5869 break;
5870 case ISD::FFREXP: {
5871 Tmp1 = DAG.getNode(ISD::FP_EXTEND, dl, NVT, Node->getOperand(0));
5872 Tmp2 = DAG.getNode(ISD::FFREXP, dl, {NVT, Node->getValueType(1)}, Tmp1);
5873
5874 Results.push_back(
5875 DAG.getNode(ISD::FP_ROUND, dl, OVT, Tmp2,
5876 DAG.getIntPtrConstant(0, dl, /*isTarget=*/true)));
5877
5878 Results.push_back(Tmp2.getValue(1));
5879 break;
5880 }
5881 case ISD::FMODF:
5882 case ISD::FSINCOS:
5883 case ISD::FSINCOSPI: {
5884 Tmp1 = DAG.getNode(ISD::FP_EXTEND, dl, NVT, Node->getOperand(0));
5885 Tmp2 = DAG.getNode(Node->getOpcode(), dl, DAG.getVTList(NVT, NVT), Tmp1);
5886 Tmp3 = DAG.getIntPtrConstant(0, dl, /*isTarget=*/true);
5887 for (unsigned ResNum = 0; ResNum < Node->getNumValues(); ResNum++)
5888 Results.push_back(
5889 DAG.getNode(ISD::FP_ROUND, dl, OVT, Tmp2.getValue(ResNum), Tmp3));
5890 break;
5891 }
5892 case ISD::FFLOOR:
5893 case ISD::FCEIL:
5894 case ISD::FRINT:
5895 case ISD::FNEARBYINT:
5896 case ISD::FROUND:
5897 case ISD::FROUNDEVEN:
5898 case ISD::FTRUNC:
5899 case ISD::FNEG:
5900 case ISD::FSQRT:
5901 case ISD::FSIN:
5902 case ISD::FCOS:
5903 case ISD::FTAN:
5904 case ISD::FASIN:
5905 case ISD::FACOS:
5906 case ISD::FATAN:
5907 case ISD::FSINH:
5908 case ISD::FCOSH:
5909 case ISD::FTANH:
5910 case ISD::FLOG:
5911 case ISD::FLOG2:
5912 case ISD::FLOG10:
5913 case ISD::FABS:
5914 case ISD::FEXP:
5915 case ISD::FEXP2:
5916 case ISD::FEXP10:
5917 case ISD::FCANONICALIZE:
5918 Tmp1 = DAG.getNode(ISD::FP_EXTEND, dl, NVT, Node->getOperand(0));
5919 Tmp2 = DAG.getNode(Node->getOpcode(), dl, NVT, Tmp1);
5920 Results.push_back(
5921 DAG.getNode(ISD::FP_ROUND, dl, OVT, Tmp2,
5922 DAG.getIntPtrConstant(0, dl, /*isTarget=*/true)));
5923 break;
5924 case ISD::STRICT_FFLOOR:
5925 case ISD::STRICT_FCEIL:
5926 case ISD::STRICT_FRINT:
5928 case ISD::STRICT_FROUND:
5930 case ISD::STRICT_FTRUNC:
5931 case ISD::STRICT_FSQRT:
5932 case ISD::STRICT_FSIN:
5933 case ISD::STRICT_FCOS:
5934 case ISD::STRICT_FTAN:
5935 case ISD::STRICT_FASIN:
5936 case ISD::STRICT_FACOS:
5937 case ISD::STRICT_FATAN:
5938 case ISD::STRICT_FSINH:
5939 case ISD::STRICT_FCOSH:
5940 case ISD::STRICT_FTANH:
5941 case ISD::STRICT_FLOG:
5942 case ISD::STRICT_FLOG2:
5943 case ISD::STRICT_FLOG10:
5944 case ISD::STRICT_FEXP:
5945 case ISD::STRICT_FEXP2:
5946 Tmp1 = DAG.getNode(ISD::STRICT_FP_EXTEND, dl, {NVT, MVT::Other},
5947 {Node->getOperand(0), Node->getOperand(1)});
5948 Tmp2 = DAG.getNode(Node->getOpcode(), dl, {NVT, MVT::Other},
5949 {Tmp1.getValue(1), Tmp1});
5950 Tmp3 = DAG.getNode(ISD::STRICT_FP_ROUND, dl, {OVT, MVT::Other},
5951 {Tmp2.getValue(1), Tmp2,
5952 DAG.getIntPtrConstant(0, dl, /*isTarget=*/true)});
5953 Results.push_back(Tmp3);
5954 Results.push_back(Tmp3.getValue(1));
5955 break;
5956 case ISD::BUILD_VECTOR: {
5957 MVT EltVT = OVT.getVectorElementType();
5958 MVT NewEltVT = NVT.getVectorElementType();
5959
5960 // Handle bitcasts to a different vector type with the same total bit size
5961 //
5962 // e.g. v2i64 = build_vector i64:x, i64:y => v4i32
5963 // =>
5964 // v4i32 = concat_vectors (v2i32 (bitcast i64:x)), (v2i32 (bitcast i64:y))
5965
5966 assert(NVT.isVector() && OVT.getSizeInBits() == NVT.getSizeInBits() &&
5967 "Invalid promote type for build_vector");
5968 assert(NewEltVT.bitsLE(EltVT) && "not handled");
5969
5970 MVT MidVT = getPromotedVectorElementType(TLI, EltVT, NewEltVT);
5971
5973 for (const SDValue &Op : Node->op_values())
5974 NewOps.push_back(DAG.getNode(ISD::BITCAST, SDLoc(Op), MidVT, Op));
5975
5976 SDLoc SL(Node);
5977 SDValue Concat =
5978 DAG.getNode(MidVT == NewEltVT ? ISD::BUILD_VECTOR : ISD::CONCAT_VECTORS,
5979 SL, NVT, NewOps);
5980 SDValue CvtVec = DAG.getNode(ISD::BITCAST, SL, OVT, Concat);
5981 Results.push_back(CvtVec);
5982 break;
5983 }
5985 MVT EltVT = OVT.getVectorElementType();
5986 MVT NewEltVT = NVT.getVectorElementType();
5987
5988 // Handle bitcasts to a different vector type with the same total bit size.
5989 //
5990 // e.g. v2i64 = extract_vector_elt x:v2i64, y:i32
5991 // =>
5992 // v4i32:castx = bitcast x:v2i64
5993 //
5994 // i64 = bitcast
5995 // (v2i32 build_vector (i32 (extract_vector_elt castx, (2 * y))),
5996 // (i32 (extract_vector_elt castx, (2 * y + 1)))
5997 //
5998
5999 assert(NVT.isVector() && OVT.getSizeInBits() == NVT.getSizeInBits() &&
6000 "Invalid promote type for extract_vector_elt");
6001 assert(NewEltVT.bitsLT(EltVT) && "not handled");
6002
6003 MVT MidVT = getPromotedVectorElementType(TLI, EltVT, NewEltVT);
6004 unsigned NewEltsPerOldElt = MidVT.getVectorNumElements();
6005
6006 SDValue Idx = Node->getOperand(1);
6007 EVT IdxVT = Idx.getValueType();
6008 SDLoc SL(Node);
6009 SDValue Factor = DAG.getConstant(NewEltsPerOldElt, SL, IdxVT);
6010 SDValue NewBaseIdx = DAG.getNode(ISD::MUL, SL, IdxVT, Idx, Factor);
6011
6012 SDValue CastVec = DAG.getNode(ISD::BITCAST, SL, NVT, Node->getOperand(0));
6013
6015 for (unsigned I = 0; I < NewEltsPerOldElt; ++I) {
6016 SDValue IdxOffset = DAG.getConstant(I, SL, IdxVT);
6017 SDValue TmpIdx = DAG.getNode(ISD::ADD, SL, IdxVT, NewBaseIdx, IdxOffset);
6018
6019 SDValue Elt = DAG.getNode(ISD::EXTRACT_VECTOR_ELT, SL, NewEltVT,
6020 CastVec, TmpIdx);
6021 NewOps.push_back(Elt);
6022 }
6023
6024 SDValue NewVec = DAG.getBuildVector(MidVT, SL, NewOps);
6025 Results.push_back(DAG.getNode(ISD::BITCAST, SL, EltVT, NewVec));
6026 break;
6027 }
6029 MVT EltVT = OVT.getVectorElementType();
6030 MVT NewEltVT = NVT.getVectorElementType();
6031
6032 // Handle bitcasts to a different vector type with the same total bit size
6033 //
6034 // e.g. v2i64 = insert_vector_elt x:v2i64, y:i64, z:i32
6035 // =>
6036 // v4i32:castx = bitcast x:v2i64
6037 // v2i32:casty = bitcast y:i64
6038 //
6039 // v2i64 = bitcast
6040 // (v4i32 insert_vector_elt
6041 // (v4i32 insert_vector_elt v4i32:castx,
6042 // (extract_vector_elt casty, 0), 2 * z),
6043 // (extract_vector_elt casty, 1), (2 * z + 1))
6044
6045 assert(NVT.isVector() && OVT.getSizeInBits() == NVT.getSizeInBits() &&
6046 "Invalid promote type for insert_vector_elt");
6047 assert(NewEltVT.bitsLT(EltVT) && "not handled");
6048
6049 MVT MidVT = getPromotedVectorElementType(TLI, EltVT, NewEltVT);
6050 unsigned NewEltsPerOldElt = MidVT.getVectorNumElements();
6051
6052 SDValue Val = Node->getOperand(1);
6053 SDValue Idx = Node->getOperand(2);
6054 EVT IdxVT = Idx.getValueType();
6055 SDLoc SL(Node);
6056
6057 SDValue Factor = DAG.getConstant(NewEltsPerOldElt, SDLoc(), IdxVT);
6058 SDValue NewBaseIdx = DAG.getNode(ISD::MUL, SL, IdxVT, Idx, Factor);
6059
6060 SDValue CastVec = DAG.getNode(ISD::BITCAST, SL, NVT, Node->getOperand(0));
6061 SDValue CastVal = DAG.getNode(ISD::BITCAST, SL, MidVT, Val);
6062
6063 SDValue NewVec = CastVec;
6064 for (unsigned I = 0; I < NewEltsPerOldElt; ++I) {
6065 SDValue IdxOffset = DAG.getConstant(I, SL, IdxVT);
6066 SDValue InEltIdx = DAG.getNode(ISD::ADD, SL, IdxVT, NewBaseIdx, IdxOffset);
6067
6068 SDValue Elt = DAG.getNode(ISD::EXTRACT_VECTOR_ELT, SL, NewEltVT,
6069 CastVal, IdxOffset);
6070
6071 NewVec = DAG.getNode(ISD::INSERT_VECTOR_ELT, SL, NVT,
6072 NewVec, Elt, InEltIdx);
6073 }
6074
6075 Results.push_back(DAG.getNode(ISD::BITCAST, SL, OVT, NewVec));
6076 break;
6077 }
6078 case ISD::SCALAR_TO_VECTOR: {
6079 MVT EltVT = OVT.getVectorElementType();
6080 MVT NewEltVT = NVT.getVectorElementType();
6081
6082 // Handle bitcasts to different vector type with the same total bit size.
6083 //
6084 // e.g. v2i64 = scalar_to_vector x:i64
6085 // =>
6086 // concat_vectors (v2i32 bitcast x:i64), (v2i32 undef)
6087 //
6088
6089 MVT MidVT = getPromotedVectorElementType(TLI, EltVT, NewEltVT);
6090 SDValue Val = Node->getOperand(0);
6091 SDLoc SL(Node);
6092
6093 SDValue CastVal = DAG.getNode(ISD::BITCAST, SL, MidVT, Val);
6094 SDValue Undef = DAG.getUNDEF(MidVT);
6095
6097 NewElts.push_back(CastVal);
6098 for (unsigned I = 1, NElts = OVT.getVectorNumElements(); I != NElts; ++I)
6099 NewElts.push_back(Undef);
6100
6101 SDValue Concat = DAG.getNode(ISD::CONCAT_VECTORS, SL, NVT, NewElts);
6102 SDValue CvtVec = DAG.getNode(ISD::BITCAST, SL, OVT, Concat);
6103 Results.push_back(CvtVec);
6104 break;
6105 }
6106 case ISD::ATOMIC_SWAP:
6107 case ISD::ATOMIC_STORE: {
6108 AtomicSDNode *AM = cast<AtomicSDNode>(Node);
6109 SDLoc SL(Node);
6110 SDValue CastVal = DAG.getNode(ISD::BITCAST, SL, NVT, AM->getVal());
6111 assert(NVT.getSizeInBits() == OVT.getSizeInBits() &&
6112 "unexpected promotion type");
6113 assert(AM->getMemoryVT().getSizeInBits() == NVT.getSizeInBits() &&
6114 "unexpected atomic_swap with illegal type");
6115
6116 SDValue Op0 = AM->getBasePtr();
6117 SDValue Op1 = CastVal;
6118
6119 // ATOMIC_STORE uses a swapped operand order from every other AtomicSDNode,
6120 // but really it should merge with ISD::STORE.
6121 if (AM->getOpcode() == ISD::ATOMIC_STORE)
6122 std::swap(Op0, Op1);
6123
6124 SDValue NewAtomic = DAG.getAtomic(AM->getOpcode(), SL, NVT, AM->getChain(),
6125 Op0, Op1, AM->getMemOperand());
6126
6127 if (AM->getOpcode() != ISD::ATOMIC_STORE) {
6128 Results.push_back(DAG.getNode(ISD::BITCAST, SL, OVT, NewAtomic));
6129 Results.push_back(NewAtomic.getValue(1));
6130 } else
6131 Results.push_back(NewAtomic);
6132 break;
6133 }
6134 case ISD::ATOMIC_LOAD: {
6135 AtomicSDNode *AM = cast<AtomicSDNode>(Node);
6136 SDLoc SL(Node);
6137 assert(NVT.getSizeInBits() == OVT.getSizeInBits() &&
6138 "unexpected promotion type");
6139 assert(AM->getMemoryVT().getSizeInBits() == NVT.getSizeInBits() &&
6140 "unexpected atomic_load with illegal type");
6141
6142 SDValue NewAtomic =
6143 DAG.getAtomic(ISD::ATOMIC_LOAD, SL, NVT, DAG.getVTList(NVT, MVT::Other),
6144 {AM->getChain(), AM->getBasePtr()}, AM->getMemOperand());
6145 Results.push_back(DAG.getNode(ISD::BITCAST, SL, OVT, NewAtomic));
6146 Results.push_back(NewAtomic.getValue(1));
6147 break;
6148 }
6149 case ISD::SPLAT_VECTOR: {
6150 SDValue Scalar = Node->getOperand(0);
6151 MVT ScalarType = Scalar.getSimpleValueType();
6152 MVT NewScalarType = NVT.getVectorElementType();
6153 if (ScalarType.isInteger()) {
6154 Tmp1 = DAG.getNode(ISD::ANY_EXTEND, dl, NewScalarType, Scalar);
6155 Tmp2 = DAG.getNode(Node->getOpcode(), dl, NVT, Tmp1);
6156 Results.push_back(DAG.getNode(ISD::TRUNCATE, dl, OVT, Tmp2));
6157 break;
6158 }
6159 Tmp1 = DAG.getNode(ISD::FP_EXTEND, dl, NewScalarType, Scalar);
6160 Tmp2 = DAG.getNode(Node->getOpcode(), dl, NVT, Tmp1);
6161 Results.push_back(
6162 DAG.getNode(ISD::FP_ROUND, dl, OVT, Tmp2,
6163 DAG.getIntPtrConstant(0, dl, /*isTarget=*/true)));
6164 break;
6165 }
6170 case ISD::VP_REDUCE_FMAX:
6171 case ISD::VP_REDUCE_FMIN:
6172 case ISD::VP_REDUCE_FMAXIMUM:
6173 case ISD::VP_REDUCE_FMINIMUM:
6174 Results.push_back(PromoteReduction(Node));
6175 break;
6176 }
6177
6178 // Replace the original node with the legalized result.
6179 if (!Results.empty()) {
6180 LLVM_DEBUG(dbgs() << "Successfully promoted node\n");
6181 ReplaceNode(Node, Results.data());
6182 } else
6183 LLVM_DEBUG(dbgs() << "Could not promote node\n");
6184}
6185
6186/// This is the entry point for the file.
6189
6190 SmallPtrSet<SDNode *, 16> LegalizedNodes;
6191 // Use a delete listener to remove nodes which were deleted during
6192 // legalization from LegalizeNodes. This is needed to handle the situation
6193 // where a new node is allocated by the object pool to the same address of a
6194 // previously deleted node.
6195 DAGNodeDeletedListener DeleteListener(
6196 *this,
6197 [&LegalizedNodes](SDNode *N, SDNode *E) { LegalizedNodes.erase(N); });
6198
6199 SelectionDAGLegalize Legalizer(*this, LegalizedNodes);
6200
6201 // Visit all the nodes. We start in topological order, so that we see
6202 // nodes with their original operands intact. Legalization can produce
6203 // new nodes which may themselves need to be legalized. Iterate until all
6204 // nodes have been legalized.
6205 while (true) {
6206 bool AnyLegalized = false;
6207 for (auto NI = allnodes_end(); NI != allnodes_begin();) {
6208 --NI;
6209
6210 SDNode *N = &*NI;
6211 if (N->use_empty() && N != getRoot().getNode()) {
6212 ++NI;
6213 DeleteNode(N);
6214 continue;
6215 }
6216
6217 if (LegalizedNodes.insert(N).second) {
6218 AnyLegalized = true;
6219 Legalizer.LegalizeOp(N);
6220
6221 if (N->use_empty() && N != getRoot().getNode()) {
6222 ++NI;
6223 DeleteNode(N);
6224 }
6225 }
6226 }
6227 if (!AnyLegalized)
6228 break;
6229
6230 }
6231
6232 // Remove dead nodes now.
6234}
6235
6237 SmallSetVector<SDNode *, 16> &UpdatedNodes) {
6238 SmallPtrSet<SDNode *, 16> LegalizedNodes;
6239 SelectionDAGLegalize Legalizer(*this, LegalizedNodes, &UpdatedNodes);
6240
6241 // Directly insert the node in question, and legalize it. This will recurse
6242 // as needed through operands.
6243 LegalizedNodes.insert(N);
6244 Legalizer.LegalizeOp(N);
6245
6246 return LegalizedNodes.count(N);
6247}
#define Success
aarch64 falkor hwpf fix Falkor HW Prefetch Fix Late Phase
return SDValue()
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
static msgpack::DocNode getNode(msgpack::DocNode DN, msgpack::Type Type, MCValue Val)
static bool isConstant(const MachineInstr &MI)
This file declares a class to represent arbitrary precision floating point values and provide a varie...
This file implements a class to represent arbitrary precision integral constant values and operations...
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
Function Alias Analysis Results
This file contains the declarations for the subclasses of Constant, which represent the different fla...
DXIL Legalizer
Utilities for dealing with flags related to floating point properties and mode controls.
static MaybeAlign getAlign(Value *Ptr)
const AbstractManglingParser< Derived, Alloc >::OperatorInfo AbstractManglingParser< Derived, Alloc >::Ops[]
static bool ExpandBVWithShuffles(SDNode *Node, SelectionDAG &DAG, const TargetLowering &TLI, SDValue &Res)
static bool isSinCosLibcallAvailable(SDNode *Node, const TargetLowering &TLI)
Return true if sincos or __sincos_stret libcall is available.
static bool useSinCos(SDNode *Node)
Only issue sincos libcall if both sin and cos are needed.
static bool canUseFastMathLibcall(const SDNode *Node)
Return if we can use the FAST_* variant of a math libcall for the node.
static MachineMemOperand * getStackAlignedMMO(SDValue StackPtr, MachineFunction &MF, bool isObjectScalable)
static MVT getPromotedVectorElementType(const TargetLowering &TLI, MVT EltVT, MVT NewEltVT)
#define F(x, y, z)
Definition MD5.cpp:54
#define I(x, y, z)
Definition MD5.cpp:57
std::pair< MCSymbol *, MachineModuleInfoImpl::StubValueTy > PairTy
Promote Memory to Register
Definition Mem2Reg.cpp:110
This file contains the declarations for metadata subclasses.
PowerPC Reduce CR logical Operation
static constexpr MCPhysReg SPReg
const SmallVectorImpl< MachineOperand > & Cond
static cl::opt< RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode > Mode("regalloc-enable-advisor", cl::Hidden, cl::init(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Default), cl::desc("Enable regalloc advisor mode"), cl::values(clEnumValN(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Default, "default", "Default"), clEnumValN(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Release, "release", "precompiled"), clEnumValN(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Development, "development", "for training")))
This file implements a set that has insertion order iteration characteristics.
This file defines the SmallPtrSet class.
This file defines the SmallSet class.
This file defines the SmallVector class.
#define LLVM_DEBUG(...)
Definition Debug.h:114
static TableGen::Emitter::OptClass< SkeletonEmitter > X("gen-skeleton-class", "Generate example skeleton class")
This file describes how to lower LLVM code to machine code.
static constexpr int Concat[]
Value * RHS
Value * LHS
BinaryOperator * Mul
bool isSignaling() const
Definition APFloat.h:1433
static APFloat getSmallestNormalized(const fltSemantics &Sem, bool Negative=false)
Returns the smallest (by magnitude) normalized finite number in the given semantics.
Definition APFloat.h:1140
APInt bitcastToAPInt() const
Definition APFloat.h:1335
static APFloat getInf(const fltSemantics &Sem, bool Negative=false)
Factory for Positive and Negative Infinity.
Definition APFloat.h:1080
Class for arbitrary precision integers.
Definition APInt.h:78
static APInt getSignMask(unsigned BitWidth)
Get the SignMask for a specific bit width.
Definition APInt.h:230
void setBit(unsigned BitPosition)
Set the given bit to 1 whose position is given as "bitPosition".
Definition APInt.h:1331
static APInt getBitsSet(unsigned numBits, unsigned loBit, unsigned hiBit)
Get a value with a block of bits set.
Definition APInt.h:259
static APInt getSignedMaxValue(unsigned numBits)
Gets maximum signed value of APInt for a specific bit width.
Definition APInt.h:210
static APInt getOneBitSet(unsigned numBits, unsigned BitNo)
Return an APInt with exactly one bit set in the result.
Definition APInt.h:240
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition ArrayRef.h:40
const SDValue & getBasePtr() const
const SDValue & getVal() const
LLVM_ABI Type * getStructRetType() const
static LLVM_ABI bool isValueValidForType(EVT VT, const APFloat &Val)
const APFloat & getValueAPF() const
const ConstantFP * getConstantFPValue() const
const APFloat & getValueAPF() const
Definition Constants.h:328
uint64_t getZExtValue() const
Return the constant as a 64-bit unsigned integer value after it has been zero extended as appropriate...
Definition Constants.h:171
static LLVM_ABI Constant * get(ArrayRef< Constant * > V)
bool isLittleEndian() const
Layout endianness...
Definition DataLayout.h:214
bool isBigEndian() const
Definition DataLayout.h:215
LLVM_ABI Align getPrefTypeAlign(Type *Ty) const
Returns the preferred stack/global alignment for the specified type.
bool empty() const
Definition Function.h:857
const BasicBlock & back() const
Definition Function.h:860
LLVM_ABI void emitError(const Instruction *I, const Twine &ErrorStr)
emitError - Emit an error message to the currently installed error handler with optional location inf...
static LocationSize precise(uint64_t Value)
static constexpr LocationSize beforeOrAfterPointer()
Any location before or after the base pointer (but still within the underlying object).
Machine Value Type.
SimpleValueType SimpleTy
uint64_t getScalarSizeInBits() const
bool bitsLE(MVT VT) const
Return true if this has no more bits than VT.
unsigned getVectorNumElements() const
bool isVector() const
Return true if this is a vector value type.
bool isInteger() const
Return true if this is an integer or a vector integer type.
bool bitsLT(MVT VT) const
Return true if this has less bits than VT.
TypeSize getSizeInBits() const
Returns the size of the specified MVT in bits.
static MVT getVectorVT(MVT VT, unsigned NumElements)
MVT getVectorElementType() const
bool isFloatingPoint() const
Return true if this is a FP or a vector FP type.
LLVM_ABI int CreateStackObject(uint64_t Size, Align Alignment, bool isSpillSlot, const AllocaInst *Alloca=nullptr, uint8_t ID=0)
Create a new statically sized stack object, returning a nonnegative identifier to represent it.
Align getObjectAlign(int ObjectIdx) const
Return the alignment of the specified stack object.
MachineMemOperand * getMachineMemOperand(MachinePointerInfo PtrInfo, MachineMemOperand::Flags f, LLT MemTy, Align base_alignment, const AAMDNodes &AAInfo=AAMDNodes(), const MDNode *Ranges=nullptr, SyncScope::ID SSID=SyncScope::System, AtomicOrdering Ordering=AtomicOrdering::NotAtomic, AtomicOrdering FailureOrdering=AtomicOrdering::NotAtomic)
getMachineMemOperand - Allocate a new MachineMemOperand.
MachineFrameInfo & getFrameInfo()
getFrameInfo - Return the frame info object for the current function.
Function & getFunction()
Return the LLVM function that this machine code represents.
const MachineJumpTableInfo * getJumpTableInfo() const
getJumpTableInfo - Return the jump table info object for the current function.
LLVM_ABI unsigned getEntrySize(const DataLayout &TD) const
getEntrySize - Return the size of each entry in the jump table.
A description of a memory reference used in the backend.
Flags
Flags values. These may be or'd together.
@ MOStore
The memory access writes data.
MachineMemOperand * getMemOperand() const
Return a MachineMemOperand object describing the memory reference performed by operation.
const SDValue & getChain() const
EVT getMemoryVT() const
Return the type of the in-memory value.
Wrapper class for IR location info (IR ordering and DebugLoc) to be passed into SDNode creation funct...
Represents one node in the SelectionDAG.
bool isStrictFPOpcode()
Test if this node is a strict floating point pseudo-op.
ArrayRef< SDUse > ops() const
LLVM_ABI void dump() const
Dump this node, for debugging.
unsigned getOpcode() const
Return the SelectionDAG opcode value for this node.
static bool hasPredecessorHelper(const SDNode *N, SmallPtrSetImpl< const SDNode * > &Visited, SmallVectorImpl< const SDNode * > &Worklist, unsigned int MaxSteps=0, bool TopologicalPrune=false)
Returns true if N is a predecessor of any node in Worklist.
unsigned getNumValues() const
Return the number of values defined/returned by this operator.
const SDValue & getOperand(unsigned Num) const
EVT getValueType(unsigned ResNo) const
Return the type of a specified result.
iterator_range< user_iterator > users()
Unlike LLVM values, Selection DAG nodes may return multiple values as the result of a computation.
bool isUndef() const
SDNode * getNode() const
get the SDNode which holds the desired result
SDValue getValue(unsigned R) const
EVT getValueType() const
Return the ValueType of the referenced return value.
const SDValue & getOperand(unsigned i) const
uint64_t getScalarValueSizeInBits() const
unsigned getResNo() const
get the index which selects a specific result in the SDNode
MVT getSimpleValueType() const
Return the simple ValueType of the referenced return value.
unsigned getOpcode() const
This is used to represent a portion of an LLVM function in a low-level Data Dependence DAG representa...
LLVM_ABI SDValue getShiftAmountOperand(EVT LHSTy, SDValue Op)
Return the specified value casted to the target's desired shift amount type.
LLVM_ABI SDValue getExtLoad(ISD::LoadExtType ExtType, const SDLoc &dl, EVT VT, SDValue Chain, SDValue Ptr, MachinePointerInfo PtrInfo, EVT MemVT, MaybeAlign Alignment=MaybeAlign(), MachineMemOperand::Flags MMOFlags=MachineMemOperand::MONone, const AAMDNodes &AAInfo=AAMDNodes())
const SDValue & getRoot() const
Return the root tag of the SelectionDAG.
bool isKnownNeverSNaN(SDValue Op, const APInt &DemandedElts, unsigned Depth=0) const
const TargetSubtargetInfo & getSubtarget() const
SDValue getCopyToReg(SDValue Chain, const SDLoc &dl, Register Reg, SDValue N)
LLVM_ABI SDValue getMergeValues(ArrayRef< SDValue > Ops, const SDLoc &dl)
Create a MERGE_VALUES node from the given operands.
LLVM_ABI SDVTList getVTList(EVT VT)
Return an SDVTList that represents the list of values specified.
LLVM_ABI SDValue getShiftAmountConstant(uint64_t Val, EVT VT, const SDLoc &DL)
LLVM_ABI SDValue getAllOnesConstant(const SDLoc &DL, EVT VT, bool IsTarget=false, bool IsOpaque=false)
LLVM_ABI SDValue getFreeze(SDValue V)
Return a freeze using the SDLoc of the value operand.
LLVM_ABI SDValue getConstantPool(const Constant *C, EVT VT, MaybeAlign Align=std::nullopt, int Offs=0, bool isT=false, unsigned TargetFlags=0)
LLVM_ABI SDValue getAtomicCmpSwap(unsigned Opcode, const SDLoc &dl, EVT MemVT, SDVTList VTs, SDValue Chain, SDValue Ptr, SDValue Cmp, SDValue Swp, MachineMemOperand *MMO)
Gets a node for an atomic cmpxchg op.
SDValue getSetCC(const SDLoc &DL, EVT VT, SDValue LHS, SDValue RHS, ISD::CondCode Cond, SDValue Chain=SDValue(), bool IsSignaling=false)
Helper function to make it easier to build SetCC's if you just have an ISD::CondCode instead of an SD...
LLVM_ABI SDValue UnrollVectorOp(SDNode *N, unsigned ResNE=0)
Utility function used by legalize and lowering to "unroll" a vector operation by splitting out the sc...
LLVM_ABI SDValue getConstantFP(double Val, const SDLoc &DL, EVT VT, bool isTarget=false)
Create a ConstantFPSDNode wrapping a constant value.
LLVM_ABI SDValue getLoad(EVT VT, const SDLoc &dl, SDValue Chain, SDValue Ptr, MachinePointerInfo PtrInfo, MaybeAlign Alignment=MaybeAlign(), MachineMemOperand::Flags MMOFlags=MachineMemOperand::MONone, const AAMDNodes &AAInfo=AAMDNodes(), const MDNode *Ranges=nullptr)
Loads are not normal binary operators: their result type is not determined by their operands,...
LLVM_ABI SDValue getAtomic(unsigned Opcode, const SDLoc &dl, EVT MemVT, SDValue Chain, SDValue Ptr, SDValue Val, MachineMemOperand *MMO)
Gets a node for an atomic op, produces result (if relevant) and chain and takes 2 operands.
LLVM_ABI bool shouldOptForSize() const
LLVM_ABI SDValue getNOT(const SDLoc &DL, SDValue Val, EVT VT)
Create a bitwise NOT operation as (XOR Val, -1).
const TargetLowering & getTargetLoweringInfo() const
LLVM_ABI SDValue expandVACopy(SDNode *Node)
Expand the specified ISD::VACOPY node as the Legalize pass would.
allnodes_const_iterator allnodes_begin() const
SDValue getUNDEF(EVT VT)
Return an UNDEF node. UNDEF does not have a useful SDLoc.
SDValue getCALLSEQ_END(SDValue Chain, SDValue Op1, SDValue Op2, SDValue InGlue, const SDLoc &DL)
Return a new CALLSEQ_END node, which always must have a glue result (to ensure it's not CSE'd).
SDValue getBuildVector(EVT VT, const SDLoc &DL, ArrayRef< SDValue > Ops)
Return an ISD::BUILD_VECTOR node.
allnodes_const_iterator allnodes_end() const
LLVM_ABI void DeleteNode(SDNode *N)
Remove the specified node from the system.
SDValue getCopyFromReg(SDValue Chain, const SDLoc &dl, Register Reg, EVT VT)
SDValue getSelect(const SDLoc &DL, EVT VT, SDValue Cond, SDValue LHS, SDValue RHS, SDNodeFlags Flags=SDNodeFlags())
Helper function to make it easier to build Select's if you just have operands and don't want to check...
LLVM_ABI SDValue getZeroExtendInReg(SDValue Op, const SDLoc &DL, EVT VT)
Return the expression required to zero extend the Op value assuming it was the smaller SrcTy value.
const DataLayout & getDataLayout() const
LLVM_ABI SDValue expandVAArg(SDNode *Node)
Expand the specified ISD::VAARG node as the Legalize pass would.
LLVM_ABI void Legalize()
This transforms the SelectionDAG into a SelectionDAG that is compatible with the target instruction s...
LLVM_ABI SDValue getTokenFactor(const SDLoc &DL, SmallVectorImpl< SDValue > &Vals)
Creates a new TokenFactor containing Vals.
LLVM_ABI bool LegalizeOp(SDNode *N, SmallSetVector< SDNode *, 16 > &UpdatedNodes)
Transforms a SelectionDAG node and any operands to it into a node that is compatible with the target ...
LLVM_ABI SDValue getConstant(uint64_t Val, const SDLoc &DL, EVT VT, bool isTarget=false, bool isOpaque=false)
Create a ConstantSDNode wrapping a constant value.
LLVM_ABI SDValue getMemBasePlusOffset(SDValue Base, TypeSize Offset, const SDLoc &DL, const SDNodeFlags Flags=SDNodeFlags())
Returns sum of the base pointer and offset.
LLVM_ABI SDValue getVAArg(EVT VT, const SDLoc &dl, SDValue Chain, SDValue Ptr, SDValue SV, unsigned Align)
VAArg produces a result and token chain, and takes a pointer and a source value as input.
LLVM_ABI SDValue getTruncStore(SDValue Chain, const SDLoc &dl, SDValue Val, SDValue Ptr, MachinePointerInfo PtrInfo, EVT SVT, Align Alignment, MachineMemOperand::Flags MMOFlags=MachineMemOperand::MONone, const AAMDNodes &AAInfo=AAMDNodes())
LLVM_ABI void ReplaceAllUsesWith(SDValue From, SDValue To)
Modify anything using 'From' to use 'To' instead.
LLVM_ABI SDValue makeStateFunctionCall(unsigned LibFunc, SDValue Ptr, SDValue InChain, const SDLoc &DLoc)
Helper used to make a call to a library function that has one argument of pointer type.
LLVM_ABI SDValue getStore(SDValue Chain, const SDLoc &dl, SDValue Val, SDValue Ptr, MachinePointerInfo PtrInfo, Align Alignment, MachineMemOperand::Flags MMOFlags=MachineMemOperand::MONone, const AAMDNodes &AAInfo=AAMDNodes())
Helper function to build ISD::STORE nodes.
LLVM_ABI SDValue getSignedConstant(int64_t Val, const SDLoc &DL, EVT VT, bool isTarget=false, bool isOpaque=false)
SDValue getCALLSEQ_START(SDValue Chain, uint64_t InSize, uint64_t OutSize, const SDLoc &DL)
Return a new CALLSEQ_START node, that starts new call frame, in which InSize bytes are set up inside ...
LLVM_ABI void RemoveDeadNodes()
This method deletes all unreachable nodes in the SelectionDAG.
SDValue getSelectCC(const SDLoc &DL, SDValue LHS, SDValue RHS, SDValue True, SDValue False, ISD::CondCode Cond, SDNodeFlags Flags=SDNodeFlags())
Helper function to make it easier to build SelectCC's if you just have an ISD::CondCode instead of an...
LLVM_ABI SDValue getSExtOrTrunc(SDValue Op, const SDLoc &DL, EVT VT)
Convert Op, which must be of integer type, to the integer type VT, by either sign-extending or trunca...
LLVM_ABI SDValue getBoolExtOrTrunc(SDValue Op, const SDLoc &SL, EVT VT, EVT OpVT)
Convert Op, which must be of integer type, to the integer type VT, by using an extension appropriate ...
LLVM_ABI SDValue getExternalSymbol(const char *Sym, EVT VT)
const TargetMachine & getTarget() const
LLVM_ABI std::pair< SDValue, SDValue > getStrictFPExtendOrRound(SDValue Op, SDValue Chain, const SDLoc &DL, EVT VT)
Convert Op, which must be a STRICT operation of float type, to the float type VT, by either extending...
LLVM_ABI SDValue getVPLogicalNOT(const SDLoc &DL, SDValue Val, SDValue Mask, SDValue EVL, EVT VT)
Create a vector-predicated logical NOT operation as (VP_XOR Val, BooleanOne, Mask,...
LLVM_ABI SDValue getAnyExtOrTrunc(SDValue Op, const SDLoc &DL, EVT VT)
Convert Op, which must be of integer type, to the integer type VT, by either any-extending or truncat...
LLVM_ABI SDValue getIntPtrConstant(uint64_t Val, const SDLoc &DL, bool isTarget=false)
LLVM_ABI SDValue getValueType(EVT)
LLVM_ABI SDValue getNode(unsigned Opcode, const SDLoc &DL, EVT VT, ArrayRef< SDUse > Ops)
Gets or creates the specified node.
LLVM_ABI SDValue getFPExtendOrRound(SDValue Op, const SDLoc &DL, EVT VT)
Convert Op, which must be of float type, to the float type VT, by either extending or rounding (by tr...
LLVM_ABI unsigned AssignTopologicalOrder()
Topological-sort the AllNodes list and a assign a unique node id for each node in the DAG based on th...
const TargetLibraryInfo & getLibInfo() const
LLVM_ABI SDValue getBoolConstant(bool V, const SDLoc &DL, EVT VT, EVT OpVT)
Create a true or false constant of type VT using the target's BooleanContent for type OpVT.
LLVM_ABI SDValue getVectorIdxConstant(uint64_t Val, const SDLoc &DL, bool isTarget=false)
LLVM_ABI void ReplaceAllUsesOfValueWith(SDValue From, SDValue To)
Replace any uses of From with To, leaving uses of other values produced by From.getNode() alone.
MachineFunction & getMachineFunction() const
SDValue getPOISON(EVT VT)
Return a POISON node. POISON does not have a useful SDLoc.
SDValue getSplatBuildVector(EVT VT, const SDLoc &DL, SDValue Op)
Return a splat ISD::BUILD_VECTOR node, consisting of Op splatted to all elements.
LLVM_ABI SDValue getFrameIndex(int FI, EVT VT, bool isTarget=false)
LLVM_ABI SDValue getZExtOrTrunc(SDValue Op, const SDLoc &DL, EVT VT)
Convert Op, which must be of integer type, to the integer type VT, by either zero-extending or trunca...
LLVM_ABI SDValue getCondCode(ISD::CondCode Cond)
SDValue getObjectPtrOffset(const SDLoc &SL, SDValue Ptr, TypeSize Offset)
Create an add instruction with appropriate flags when used for addressing some offset of an object.
LLVMContext * getContext() const
LLVM_ABI SDValue CreateStackTemporary(TypeSize Bytes, Align Alignment)
Create a stack temporary based on the size in bytes and the alignment.
LLVM_ABI SDNode * UpdateNodeOperands(SDNode *N, SDValue Op)
Mutate the specified node in-place to have the specified operands.
SDValue getEntryNode() const
Return the token chain corresponding to the entry of the function.
LLVM_ABI SDValue getVectorShuffle(EVT VT, const SDLoc &dl, SDValue N1, SDValue N2, ArrayRef< int > Mask)
Return an ISD::VECTOR_SHUFFLE node.
LLVM_ABI SDValue getLogicalNOT(const SDLoc &DL, SDValue Val, EVT VT)
Create a logical NOT operation as (XOR Val, BooleanOne).
bool insert(const value_type &X)
Insert a new element into the SetVector.
Definition SetVector.h:151
A templated base class for SmallPtrSet which provides the typesafe interface that is common across al...
bool erase(PtrType Ptr)
Remove pointer from the set.
size_type count(ConstPtrType Ptr) const
count - Return 1 if the specified pointer is in the set, 0 otherwise.
std::pair< iterator, bool > insert(PtrType Ptr)
Inserts Ptr if and only if there is no element in the container equal to Ptr.
SmallPtrSet - This class implements a set which is optimized for holding SmallSize or less elements.
A SetVector that performs no allocations if smaller than a certain size.
Definition SetVector.h:339
std::pair< const_iterator, bool > insert(const T &V)
insert - Insert an element into the set if it isn't already there.
Definition SmallSet.h:183
size_type size() const
Definition SmallSet.h:170
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
void reserve(size_type N)
void swap(SmallVectorImpl &RHS)
void push_back(const T &Elt)
pointer data()
Return a pointer to the vector's buffer, even if empty().
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
This class is used to represent ISD::STORE nodes.
Align getStackAlign() const
getStackAlignment - This method returns the number of bytes to which the stack pointer must be aligne...
StackDirection getStackGrowthDirection() const
getStackGrowthDirection - Return the direction the stack grows
unsigned getIntSize() const
Get size of a C-level int or unsigned int, in bits.
bool isOperationExpand(unsigned Op, EVT VT) const
Return true if the specified operation is illegal on this target or unlikely to be made legal with cu...
virtual bool isShuffleMaskLegal(ArrayRef< int >, EVT) const
Targets can use this to indicate that they only support some VECTOR_SHUFFLE operations,...
virtual bool shouldExpandBuildVectorWithShuffles(EVT, unsigned DefinedValues) const
virtual bool isSExtCheaperThanZExt(EVT FromTy, EVT ToTy) const
Return true if sign-extension from FromTy to ToTy is cheaper than zero-extension.
MVT getVectorIdxTy(const DataLayout &DL) const
Returns the type to be used for the index operand of: ISD::INSERT_VECTOR_ELT, ISD::EXTRACT_VECTOR_ELT...
bool isOperationLegalOrPromote(unsigned Op, EVT VT, bool LegalOnly=false) const
Return true if the specified operation is legal on this target or can be made legal using promotion.
LegalizeAction getCondCodeAction(ISD::CondCode CC, MVT VT) const
Return how the condition code should be treated: either it is legal, needs to be expanded to some oth...
CallingConv::ID getLibcallImplCallingConv(RTLIB::LibcallImpl Call) const
Get the CallingConv that should be used for the specified libcall implementation.
virtual bool isFPImmLegal(const APFloat &, EVT, bool ForCodeSize=false) const
Returns true if the target can instruction select the specified FP immediate natively.
Register getStackPointerRegisterToSaveRestore() const
If a physical register, this specifies the register that llvm.savestack/llvm.restorestack should save...
LegalizeAction getFixedPointOperationAction(unsigned Op, EVT VT, unsigned Scale) const
Some fixed point operations may be natively supported by the target but only for specific scales.
virtual ISD::NodeType getExtendForAtomicOps() const
Returns how the platform's atomic operations are extended (ZERO_EXTEND, SIGN_EXTEND,...
EVT getShiftAmountTy(EVT LHSTy, const DataLayout &DL) const
Returns the type for the shift amount of a shift opcode.
bool isStrictFPEnabled() const
Return true if the target support strict float operation.
virtual EVT getSetCCResultType(const DataLayout &DL, LLVMContext &Context, EVT VT) const
Return the ValueType of the result of SETCC operations.
virtual EVT getTypeToTransformTo(LLVMContext &Context, EVT VT) const
For types supported by the target, this is an identity function.
bool isCondCodeLegal(ISD::CondCode CC, MVT VT) const
Return true if the specified condition code is legal for a comparison of the specified types on this ...
bool isTypeLegal(EVT VT) const
Return true if the target has native support for the specified value type.
MVT getProgramPointerTy(const DataLayout &DL) const
Return the type for code pointers, which is determined by the program address space specified through...
virtual bool isJumpTableRelative() const
virtual bool ShouldShrinkFPConstant(EVT) const
If true, then instruction selection should seek to shrink the FP constant of the specified type to a ...
virtual MVT getPointerTy(const DataLayout &DL, uint32_t AS=0) const
Return the pointer type for the given address space, defaults to the pointer type from the data layou...
bool isOperationLegal(unsigned Op, EVT VT) const
Return true if the specified operation is legal on this target.
LegalizeAction getTruncStoreAction(EVT ValVT, EVT MemVT) const
Return how this store with truncation should be treated: either it is legal, needs to be promoted to ...
LegalizeAction getLoadExtAction(unsigned ExtType, EVT ValVT, EVT MemVT) const
Return how this load with extension should be treated: either it is legal, needs to be promoted to a ...
bool isOperationLegalOrCustom(unsigned Op, EVT VT, bool LegalOnly=false) const
Return true if the specified operation is legal on this target or can be made legal with custom lower...
virtual bool allowsMemoryAccess(LLVMContext &Context, const DataLayout &DL, EVT VT, unsigned AddrSpace=0, Align Alignment=Align(1), MachineMemOperand::Flags Flags=MachineMemOperand::MONone, unsigned *Fast=nullptr) const
Return true if the target supports a memory access of this type for the given address space and align...
virtual LegalizeAction getCustomOperationAction(SDNode &Op) const
How to legalize this custom operation?
bool isLoadExtLegalOrCustom(unsigned ExtType, EVT ValVT, EVT MemVT) const
Return true if the specified load with extension is legal or custom on this target.
LegalizeAction getStrictFPOperationAction(unsigned Op, EVT VT) const
bool isLoadExtLegal(unsigned ExtType, EVT ValVT, EVT MemVT) const
Return true if the specified load with extension is legal on this target.
RTLIB::LibcallImpl getLibcallImpl(RTLIB::Libcall Call) const
Get the libcall impl routine name for the specified libcall.
virtual bool useSoftFloat() const
bool isTruncStoreLegalOrCustom(EVT ValVT, EVT MemVT) const
Return true if the specified store with truncation has solution on this target.
LegalizeTypeAction getTypeAction(LLVMContext &Context, EVT VT) const
Return how we should legalize values of this type, either it is already legal (return 'Legal') or we ...
virtual bool shouldSignExtendTypeInLibCall(Type *Ty, bool IsSigned) const
Returns true if arguments should be sign-extended in lib calls.
std::vector< ArgListEntry > ArgListTy
bool allowsMemoryAccessForAlignment(LLVMContext &Context, const DataLayout &DL, EVT VT, unsigned AddrSpace=0, Align Alignment=Align(1), MachineMemOperand::Flags Flags=MachineMemOperand::MONone, unsigned *Fast=nullptr) const
This function returns true if the memory access is aligned or if the target allows this specific unal...
bool isCondCodeLegalOrCustom(ISD::CondCode CC, MVT VT) const
Return true if the specified condition code is legal or custom for a comparison of the specified type...
MVT getFrameIndexTy(const DataLayout &DL) const
Return the type for frame index, which is determined by the alloca address space specified through th...
MVT getRegisterType(MVT VT) const
Return the type of registers that this ValueType will eventually require.
LegalizeAction getOperationAction(unsigned Op, EVT VT) const
Return how this operation should be treated: either it is legal, needs to be promoted to a larger siz...
MVT getTypeToPromoteTo(unsigned Op, MVT VT) const
If the action for this operation is to promote, this method returns the ValueType to promote to.
const RTLIB::RuntimeLibcallsInfo & getRuntimeLibcallsInfo() const
This class defines information used to lower LLVM code to legal SelectionDAG operators that the targe...
SDValue expandAddSubSat(SDNode *Node, SelectionDAG &DAG) const
Method for building the DAG expansion of ISD::[US][ADD|SUB]SAT.
bool expandMultipleResultFPLibCall(SelectionDAG &DAG, RTLIB::Libcall LC, SDNode *Node, SmallVectorImpl< SDValue > &Results, std::optional< unsigned > CallRetResNo={}) const
Expands a node with multiple results to an FP or vector libcall.
bool expandMULO(SDNode *Node, SDValue &Result, SDValue &Overflow, SelectionDAG &DAG) const
Method for building the DAG expansion of ISD::[US]MULO.
bool expandMUL(SDNode *N, SDValue &Lo, SDValue &Hi, EVT HiLoVT, SelectionDAG &DAG, MulExpansionKind Kind, SDValue LL=SDValue(), SDValue LH=SDValue(), SDValue RL=SDValue(), SDValue RH=SDValue()) const
Expand a MUL into two nodes.
SDValue expandCTLZ(SDNode *N, SelectionDAG &DAG) const
Expand CTLZ/CTLZ_ZERO_UNDEF nodes.
SDValue expandBITREVERSE(SDNode *N, SelectionDAG &DAG) const
Expand BITREVERSE nodes.
SDValue expandCTTZ(SDNode *N, SelectionDAG &DAG) const
Expand CTTZ/CTTZ_ZERO_UNDEF nodes.
virtual SDValue expandIndirectJTBranch(const SDLoc &dl, SDValue Value, SDValue Addr, int JTI, SelectionDAG &DAG) const
Expands target specific indirect branch for the case of JumpTable expansion.
SDValue expandABD(SDNode *N, SelectionDAG &DAG) const
Expand ABDS/ABDU nodes.
SDValue expandShlSat(SDNode *Node, SelectionDAG &DAG) const
Method for building the DAG expansion of ISD::[US]SHLSAT.
SDValue expandIS_FPCLASS(EVT ResultVT, SDValue Op, FPClassTest Test, SDNodeFlags Flags, const SDLoc &DL, SelectionDAG &DAG) const
Expand check for floating point class.
SDValue expandFP_TO_INT_SAT(SDNode *N, SelectionDAG &DAG) const
Expand FP_TO_[US]INT_SAT into FP_TO_[US]INT and selects or min/max.
SDValue expandUnalignedStore(StoreSDNode *ST, SelectionDAG &DAG) const
Expands an unaligned store to 2 half-size stores for integer values, and possibly more for vectors.
void expandSADDSUBO(SDNode *Node, SDValue &Result, SDValue &Overflow, SelectionDAG &DAG) const
Method for building the DAG expansion of ISD::S(ADD|SUB)O.
SDValue expandABS(SDNode *N, SelectionDAG &DAG, bool IsNegative=false) const
Expand ABS nodes.
SDValue expandVecReduce(SDNode *Node, SelectionDAG &DAG) const
Expand a VECREDUCE_* into an explicit calculation.
SDValue expandVPCTTZElements(SDNode *N, SelectionDAG &DAG) const
Expand VP_CTTZ_ELTS/VP_CTTZ_ELTS_ZERO_UNDEF nodes.
bool expandFP_TO_UINT(SDNode *N, SDValue &Result, SDValue &Chain, SelectionDAG &DAG) const
Expand float to UINT conversion.
bool expandREM(SDNode *Node, SDValue &Result, SelectionDAG &DAG) const
Expand an SREM or UREM using SDIV/UDIV or SDIVREM/UDIVREM, if legal.
std::pair< SDValue, SDValue > expandUnalignedLoad(LoadSDNode *LD, SelectionDAG &DAG) const
Expands an unaligned load to 2 half-size loads for an integer, and possibly more for vectors.
SDValue expandFMINIMUMNUM_FMAXIMUMNUM(SDNode *N, SelectionDAG &DAG) const
Expand fminimumnum/fmaximumnum into multiple comparison with selects.
SDValue expandVectorSplice(SDNode *Node, SelectionDAG &DAG) const
Method for building the DAG expansion of ISD::VECTOR_SPLICE.
SDValue getVectorSubVecPointer(SelectionDAG &DAG, SDValue VecPtr, EVT VecVT, EVT SubVecVT, SDValue Index, const SDNodeFlags PtrArithFlags=SDNodeFlags()) const
Get a pointer to a sub-vector of type SubVecVT at index Idx located in memory for a vector of type Ve...
SDValue expandCTPOP(SDNode *N, SelectionDAG &DAG) const
Expand CTPOP nodes.
std::pair< SDValue, SDValue > LowerCallTo(CallLoweringInfo &CLI) const
This function lowers an abstract call to a function into an actual call.
SDValue expandBSWAP(SDNode *N, SelectionDAG &DAG) const
Expand BSWAP nodes.
SDValue expandFMINIMUM_FMAXIMUM(SDNode *N, SelectionDAG &DAG) const
Expand fminimum/fmaximum into multiple comparison with selects.
bool expandFP_TO_SINT(SDNode *N, SDValue &Result, SelectionDAG &DAG) const
Expand float(f32) to SINT(i64) conversion.
virtual SDValue getPICJumpTableRelocBase(SDValue Table, SelectionDAG &DAG) const
Returns relocation base for the given PIC jumptable.
bool isInTailCallPosition(SelectionDAG &DAG, SDNode *Node, SDValue &Chain) const
Check whether a given call node is in tail position within its function.
SDValue expandFunnelShift(SDNode *N, SelectionDAG &DAG) const
Expand funnel shift.
bool LegalizeSetCCCondCode(SelectionDAG &DAG, EVT VT, SDValue &LHS, SDValue &RHS, SDValue &CC, SDValue Mask, SDValue EVL, bool &NeedInvert, const SDLoc &dl, SDValue &Chain, bool IsSignaling=false) const
Legalize a SETCC or VP_SETCC with given LHS and RHS and condition code CC on the current target.
virtual SDValue LowerOperation(SDValue Op, SelectionDAG &DAG) const
This callback is invoked for operations that are unsupported by the target, which are registered to u...
SDValue expandFixedPointDiv(unsigned Opcode, const SDLoc &dl, SDValue LHS, SDValue RHS, unsigned Scale, SelectionDAG &DAG) const
Method for building the DAG expansion of ISD::[US]DIVFIX[SAT].
SDValue expandFP_ROUND(SDNode *Node, SelectionDAG &DAG) const
Expand round(fp) to fp conversion.
SDValue expandROT(SDNode *N, bool AllowVectorOps, SelectionDAG &DAG) const
Expand rotations.
SDValue getVectorElementPointer(SelectionDAG &DAG, SDValue VecPtr, EVT VecVT, SDValue Index, const SDNodeFlags PtrArithFlags=SDNodeFlags()) const
Get a pointer to vector element Idx located in memory for a vector of type VecVT starting at a base a...
SDValue expandFMINNUM_FMAXNUM(SDNode *N, SelectionDAG &DAG) const
Expand fminnum/fmaxnum into fminnum_ieee/fmaxnum_ieee with quieted inputs.
std::pair< SDValue, SDValue > makeLibCall(SelectionDAG &DAG, RTLIB::LibcallImpl LibcallImpl, EVT RetVT, ArrayRef< SDValue > Ops, MakeLibCallOptions CallOptions, const SDLoc &dl, SDValue Chain=SDValue()) const
Returns a pair of (return value, chain).
SDValue expandCMP(SDNode *Node, SelectionDAG &DAG) const
Method for building the DAG expansion of ISD::[US]CMP.
SDValue expandFixedPointMul(SDNode *Node, SelectionDAG &DAG) const
Method for building the DAG expansion of ISD::[U|S]MULFIX[SAT].
void expandUADDSUBO(SDNode *Node, SDValue &Result, SDValue &Overflow, SelectionDAG &DAG) const
Method for building the DAG expansion of ISD::U(ADD|SUB)O.
bool expandUINT_TO_FP(SDNode *N, SDValue &Result, SDValue &Chain, SelectionDAG &DAG) const
Expand UINT(i64) to double(f64) conversion.
bool expandMUL_LOHI(unsigned Opcode, EVT VT, const SDLoc &dl, SDValue LHS, SDValue RHS, SmallVectorImpl< SDValue > &Result, EVT HiLoVT, SelectionDAG &DAG, MulExpansionKind Kind, SDValue LL=SDValue(), SDValue LH=SDValue(), SDValue RL=SDValue(), SDValue RH=SDValue()) const
Expand a MUL or [US]MUL_LOHI of n-bit values into two or four nodes, respectively,...
SDValue expandAVG(SDNode *N, SelectionDAG &DAG) const
Expand vector/scalar AVGCEILS/AVGCEILU/AVGFLOORS/AVGFLOORU nodes.
Primary interface to the complete machine description for the target machine.
const Triple & getTargetTriple() const
virtual const TargetFrameLowering * getFrameLowering() const
static constexpr TypeSize getFixed(ScalarTy ExactSize)
Definition TypeSize.h:343
LLVMContext & getContext() const
Return the LLVMContext in which this type was uniqued.
Definition Type.h:128
bool isVoidTy() const
Return true if this is 'void'.
Definition Type.h:139
static LLVM_ABI UndefValue * get(Type *T)
Static factory methods - Return an 'undef' object of the specified type.
LLVM Value Representation.
Definition Value.h:75
constexpr ScalarTy getFixedValue() const
Definition TypeSize.h:200
constexpr ScalarTy getKnownMinValue() const
Returns the minimum value this quantity can represent.
Definition TypeSize.h:165
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
constexpr char Align[]
Key for Kernel::Arg::Metadata::mAlign.
constexpr char Args[]
Key for Kernel::Metadata::mArgs.
constexpr std::underlying_type_t< E > Mask()
Get a bitmask with 1s in all places up to the high-order bit of E's largest value.
@ Entry
Definition COFF.h:862
@ Fast
Attempts to make calls as fast as possible (e.g.
Definition CallingConv.h:41
@ SETCC
SetCC operator - This evaluates to a true value iff the condition is true.
Definition ISDOpcodes.h:809
@ MERGE_VALUES
MERGE_VALUES - This node takes multiple discrete operands and returns them all as its individual resu...
Definition ISDOpcodes.h:256
@ STACKRESTORE
STACKRESTORE has two operands, an input chain and a pointer to restore to it returns an output chain.
@ STACKSAVE
STACKSAVE - STACKSAVE has one operand, an input chain.
@ CTLZ_ZERO_UNDEF
Definition ISDOpcodes.h:782
@ STRICT_FSETCC
STRICT_FSETCC/STRICT_FSETCCS - Constrained versions of SETCC, used for floating-point operands only.
Definition ISDOpcodes.h:506
@ POISON
POISON - A poison node.
Definition ISDOpcodes.h:231
@ SET_FPENV
Sets the current floating-point environment.
@ VECREDUCE_SEQ_FADD
Generic reduction nodes.
@ EH_SJLJ_LONGJMP
OUTCHAIN = EH_SJLJ_LONGJMP(INCHAIN, buffer) This corresponds to the eh.sjlj.longjmp intrinsic.
Definition ISDOpcodes.h:163
@ SMUL_LOHI
SMUL_LOHI/UMUL_LOHI - Multiply two integers of type iN, producing a signed/unsigned value of type i[2...
Definition ISDOpcodes.h:270
@ INSERT_SUBVECTOR
INSERT_SUBVECTOR(VECTOR1, VECTOR2, IDX) - Returns a vector with VECTOR2 inserted into VECTOR1.
Definition ISDOpcodes.h:595
@ BSWAP
Byte Swap and Counting operators.
Definition ISDOpcodes.h:773
@ SMULFIX
RESULT = [US]MULFIX(LHS, RHS, SCALE) - Perform fixed point multiplication on 2 integers with the same...
Definition ISDOpcodes.h:389
@ VAEND
VAEND, VASTART - VAEND and VASTART have three operands: an input chain, pointer, and a SRCVALUE.
@ ATOMIC_STORE
OUTCHAIN = ATOMIC_STORE(INCHAIN, val, ptr) This corresponds to "store atomic" instruction.
@ FRAME_TO_ARGS_OFFSET
FRAME_TO_ARGS_OFFSET - This node represents offset from frame pointer to first (possible) on-stack ar...
Definition ISDOpcodes.h:140
@ RESET_FPENV
Set floating-point environment to default state.
@ FMAD
FMAD - Perform a * b + c, while getting the same result as the separately rounded operations.
Definition ISDOpcodes.h:517
@ ADD
Simple integer binary arithmetic operators.
Definition ISDOpcodes.h:259
@ LOAD
LOAD and STORE have token chains as their first operand, then the same operands as an LLVM load/store...
@ SMULFIXSAT
Same as the corresponding unsaturated fixed point instructions, but the result is clamped between the...
Definition ISDOpcodes.h:395
@ SET_FPMODE
Sets the current dynamic floating-point control modes.
@ ANY_EXTEND
ANY_EXTEND - Used for integer types. The high bits are undefined.
Definition ISDOpcodes.h:843
@ FMA
FMA - Perform a * b + c with no intermediate rounding step.
Definition ISDOpcodes.h:513
@ FMODF
FMODF - Decomposes the operand into integral and fractional parts, each having the same type and sign...
@ FATAN2
FATAN2 - atan2, inspired by libm.
@ FSINCOSPI
FSINCOSPI - Compute both the sine and cosine times pi more accurately than FSINCOS(pi*x),...
@ INTRINSIC_VOID
OUTCHAIN = INTRINSIC_VOID(INCHAIN, INTRINSICID, arg1, arg2, ...) This node represents a target intrin...
Definition ISDOpcodes.h:215
@ EH_SJLJ_SETUP_DISPATCH
OUTCHAIN = EH_SJLJ_SETUP_DISPATCH(INCHAIN) The target initializes the dispatch table here.
Definition ISDOpcodes.h:167
@ GlobalAddress
Definition ISDOpcodes.h:88
@ ATOMIC_CMP_SWAP_WITH_SUCCESS
Val, Success, OUTCHAIN = ATOMIC_CMP_SWAP_WITH_SUCCESS(INCHAIN, ptr, cmp, swap) N.b.
@ STRICT_FMINIMUM
Definition ISDOpcodes.h:466
@ SINT_TO_FP
[SU]INT_TO_FP - These operators convert integers (whose interpreted sign depends on the first letter)...
Definition ISDOpcodes.h:870
@ CONCAT_VECTORS
CONCAT_VECTORS(VECTOR0, VECTOR1, ...) - Given a number of values of vector type with the same length ...
Definition ISDOpcodes.h:579
@ VECREDUCE_FMAX
FMIN/FMAX nodes can have flags, for NaN/NoNaN variants.
@ FADD
Simple binary floating point operators.
Definition ISDOpcodes.h:412
@ VECREDUCE_FMAXIMUM
FMINIMUM/FMAXIMUM nodes propatate NaNs and signed zeroes using the llvm.minimum and llvm....
@ ABS
ABS - Determine the unsigned absolute value of a signed integer value of the same bitwidth.
Definition ISDOpcodes.h:746
@ ATOMIC_FENCE
OUTCHAIN = ATOMIC_FENCE(INCHAIN, ordering, scope) This corresponds to the fence instruction.
@ RESET_FPMODE
Sets default dynamic floating-point control modes.
@ SDIVREM
SDIVREM/UDIVREM - Divide two integers and produce both a quotient and remainder result.
Definition ISDOpcodes.h:275
@ FP16_TO_FP
FP16_TO_FP, FP_TO_FP16 - These operators are used to perform promotions and truncation for half-preci...
Definition ISDOpcodes.h:993
@ BITCAST
BITCAST - This operator converts between integer, vector and FP values, as if the value was stored to...
Definition ISDOpcodes.h:983
@ BUILD_PAIR
BUILD_PAIR - This is the opposite of EXTRACT_ELEMENT in some ways.
Definition ISDOpcodes.h:249
@ INIT_TRAMPOLINE
INIT_TRAMPOLINE - This corresponds to the init_trampoline intrinsic.
@ FLDEXP
FLDEXP - ldexp, inspired by libm (op0 * 2**op1).
@ SDIVFIX
RESULT = [US]DIVFIX(LHS, RHS, SCALE) - Perform fixed point division on 2 integers with the same width...
Definition ISDOpcodes.h:402
@ STRICT_FSQRT
Constrained versions of libm-equivalent floating point intrinsics.
Definition ISDOpcodes.h:433
@ BUILTIN_OP_END
BUILTIN_OP_END - This must be the last enum value in this list.
@ GlobalTLSAddress
Definition ISDOpcodes.h:89
@ EH_LABEL
EH_LABEL - Represents a label in mid basic block used to track locations needed for debug and excepti...
@ EH_RETURN
OUTCHAIN = EH_RETURN(INCHAIN, OFFSET, HANDLER) - This node represents 'eh_return' gcc dwarf builtin,...
Definition ISDOpcodes.h:151
@ SIGN_EXTEND
Conversion operators.
Definition ISDOpcodes.h:834
@ AVGCEILS
AVGCEILS/AVGCEILU - Rounding averaging add - Add two integers using an integer of type i[N+2],...
Definition ISDOpcodes.h:714
@ STRICT_UINT_TO_FP
Definition ISDOpcodes.h:480
@ SCALAR_TO_VECTOR
SCALAR_TO_VECTOR(VAL) - This represents the operation of loading a scalar value into element 0 of the...
Definition ISDOpcodes.h:664
@ READSTEADYCOUNTER
READSTEADYCOUNTER - This corresponds to the readfixedcounter intrinsic.
@ ADDROFRETURNADDR
ADDROFRETURNADDR - Represents the llvm.addressofreturnaddress intrinsic.
Definition ISDOpcodes.h:117
@ VECREDUCE_FADD
These reductions have relaxed evaluation order semantics, and have a single vector operand.
@ CTTZ_ZERO_UNDEF
Bit counting operators with an undefined result for zero inputs.
Definition ISDOpcodes.h:781
@ PREFETCH
PREFETCH - This corresponds to a prefetch intrinsic.
@ FSINCOS
FSINCOS - Compute both fsin and fcos as a single operation.
@ SETCCCARRY
Like SetCC, ops #0 and #1 are the LHS and RHS operands to compare, but op #2 is a boolean indicating ...
Definition ISDOpcodes.h:817
@ FNEG
Perform various unary floating-point operations inspired by libm.
@ BR_CC
BR_CC - Conditional branch.
@ SSUBO
Same for subtraction.
Definition ISDOpcodes.h:347
@ BR_JT
BR_JT - Jumptable branch.
@ VECTOR_INTERLEAVE
VECTOR_INTERLEAVE(VEC1, VEC2, ...) - Returns N vectors from N input vectors, where N is the factor to...
Definition ISDOpcodes.h:630
@ FCANONICALIZE
Returns platform specific canonical encoding of a floating point number.
Definition ISDOpcodes.h:536
@ IS_FPCLASS
Performs a check of floating point class property, defined by IEEE-754.
Definition ISDOpcodes.h:543
@ SSUBSAT
RESULT = [US]SUBSAT(LHS, RHS) - Perform saturation subtraction on 2 integers with the same bit width ...
Definition ISDOpcodes.h:369
@ SELECT
Select(COND, TRUEVAL, FALSEVAL).
Definition ISDOpcodes.h:786
@ ATOMIC_LOAD
Val, OUTCHAIN = ATOMIC_LOAD(INCHAIN, ptr) This corresponds to "load atomic" instruction.
@ UNDEF
UNDEF - An undefined node.
Definition ISDOpcodes.h:228
@ EXTRACT_ELEMENT
EXTRACT_ELEMENT - This is used to get the lower or upper (determined by a Constant,...
Definition ISDOpcodes.h:242
@ SPLAT_VECTOR
SPLAT_VECTOR(VAL) - Returns a vector with the scalar value VAL duplicated in all lanes.
Definition ISDOpcodes.h:671
@ VACOPY
VACOPY - VACOPY has 5 operands: an input chain, a destination pointer, a source pointer,...
@ SADDO
RESULT, BOOL = [SU]ADDO(LHS, RHS) - Overflow-aware nodes for addition.
Definition ISDOpcodes.h:343
@ VECREDUCE_ADD
Integer reductions may have a result type larger than the vector element type.
@ GET_ROUNDING
Returns current rounding mode: -1 Undefined 0 Round to 0 1 Round to nearest, ties to even 2 Round to ...
Definition ISDOpcodes.h:960
@ STRICT_FP_TO_FP16
Definition ISDOpcodes.h:996
@ MULHU
MULHU/MULHS - Multiply high - Multiply two integers of type iN, producing an unsigned/signed value of...
Definition ISDOpcodes.h:703
@ GET_FPMODE
Reads the current dynamic floating-point control modes.
@ STRICT_FP16_TO_FP
Definition ISDOpcodes.h:995
@ SHL
Shift and rotation operations.
Definition ISDOpcodes.h:764
@ VECTOR_SHUFFLE
VECTOR_SHUFFLE(VEC1, VEC2) - Returns a vector, of the same type as VEC1/VEC2.
Definition ISDOpcodes.h:644
@ EXTRACT_SUBVECTOR
EXTRACT_SUBVECTOR(VECTOR, IDX) - Returns a subvector from VECTOR.
Definition ISDOpcodes.h:609
@ STRICT_FMAXIMUM
Definition ISDOpcodes.h:465
@ READ_REGISTER
READ_REGISTER, WRITE_REGISTER - This node represents llvm.register on the DAG, which implements the n...
Definition ISDOpcodes.h:134
@ EXTRACT_VECTOR_ELT
EXTRACT_VECTOR_ELT(VECTOR, IDX) - Returns a single element from VECTOR identified by the (potentially...
Definition ISDOpcodes.h:571
@ ZERO_EXTEND
ZERO_EXTEND - Used for integer types, zeroing the new bits.
Definition ISDOpcodes.h:840
@ TargetConstantFP
Definition ISDOpcodes.h:175
@ DEBUGTRAP
DEBUGTRAP - Trap intended to get the attention of a debugger.
@ SELECT_CC
Select with condition operator - This selects between a true value and a false value (ops #2 and #3) ...
Definition ISDOpcodes.h:801
@ ATOMIC_CMP_SWAP
Val, OUTCHAIN = ATOMIC_CMP_SWAP(INCHAIN, ptr, cmp, swap) For double-word atomic operations: ValLo,...
@ FMINNUM
FMINNUM/FMAXNUM - Perform floating-point minimum maximum on two values, following IEEE-754 definition...
@ UBSANTRAP
UBSANTRAP - Trap with an immediate describing the kind of sanitizer failure.
@ SSHLSAT
RESULT = [US]SHLSAT(LHS, RHS) - Perform saturation left shift.
Definition ISDOpcodes.h:381
@ SMULO
Same for multiplication.
Definition ISDOpcodes.h:351
@ DYNAMIC_STACKALLOC
DYNAMIC_STACKALLOC - Allocate some number of bytes on the stack aligned to a specified boundary.
@ SIGN_EXTEND_INREG
SIGN_EXTEND_INREG - This operator atomically performs a SHL/SRA pair to sign extend a small value in ...
Definition ISDOpcodes.h:878
@ SMIN
[US]{MIN/MAX} - Binary minimum or maximum of signed or unsigned integers.
Definition ISDOpcodes.h:726
@ SDIVFIXSAT
Same as the corresponding unsaturated fixed point instructions, but the result is clamped between the...
Definition ISDOpcodes.h:408
@ FP_EXTEND
X = FP_EXTEND(Y) - Extend a smaller FP type into a larger FP type.
Definition ISDOpcodes.h:968
@ GLOBAL_OFFSET_TABLE
The address of the GOT.
Definition ISDOpcodes.h:103
@ UADDO_CARRY
Carry-using nodes for multiple precision addition and subtraction.
Definition ISDOpcodes.h:323
@ STRICT_SINT_TO_FP
STRICT_[US]INT_TO_FP - Convert a signed or unsigned integer to a floating point value.
Definition ISDOpcodes.h:479
@ STRICT_BF16_TO_FP
@ STRICT_FROUNDEVEN
Definition ISDOpcodes.h:459
@ EH_DWARF_CFA
EH_DWARF_CFA - This node represents the pointer to the DWARF Canonical Frame Address (CFA),...
Definition ISDOpcodes.h:145
@ BF16_TO_FP
BF16_TO_FP, FP_TO_BF16 - These operators are used to perform promotions and truncation for bfloat16.
@ FRAMEADDR
FRAMEADDR, RETURNADDR - These nodes represent llvm.frameaddress and llvm.returnaddress on the DAG.
Definition ISDOpcodes.h:110
@ STRICT_FP_TO_UINT
Definition ISDOpcodes.h:473
@ STRICT_FP_ROUND
X = STRICT_FP_ROUND(Y, TRUNC) - Rounding 'Y' from a larger floating point type down to the precision ...
Definition ISDOpcodes.h:495
@ STRICT_FP_TO_SINT
STRICT_FP_TO_[US]INT - Convert a floating point value to a signed or unsigned integer.
Definition ISDOpcodes.h:472
@ FMINIMUM
FMINIMUM/FMAXIMUM - NaN-propagating minimum/maximum that also treat -0.0 as less than 0....
@ FP_TO_SINT
FP_TO_[US]INT - Convert a floating point value to a signed or unsigned integer.
Definition ISDOpcodes.h:916
@ READCYCLECOUNTER
READCYCLECOUNTER - This corresponds to the readcyclecounter intrinsic.
@ TargetConstant
TargetConstant* - Like Constant*, but the DAG does not do any folding, simplification,...
Definition ISDOpcodes.h:174
@ STRICT_FP_EXTEND
X = STRICT_FP_EXTEND(Y) - Extend a smaller FP type into a larger FP type.
Definition ISDOpcodes.h:500
@ AND
Bitwise operators - logical and, logical or, logical xor.
Definition ISDOpcodes.h:738
@ TRAP
TRAP - Trapping instruction.
@ INTRINSIC_WO_CHAIN
RESULT = INTRINSIC_WO_CHAIN(INTRINSICID, arg1, arg2, ...) This node represents a target intrinsic fun...
Definition ISDOpcodes.h:200
@ GET_FPENV_MEM
Gets the current floating-point environment.
@ STRICT_FP_TO_BF16
@ SCMP
[US]CMP - 3-way comparison of signed or unsigned integers.
Definition ISDOpcodes.h:734
@ AVGFLOORS
AVGFLOORS/AVGFLOORU - Averaging add - Add two integers using an integer of type i[N+1],...
Definition ISDOpcodes.h:709
@ STRICT_FADD
Constrained versions of the binary floating point operators.
Definition ISDOpcodes.h:422
@ INSERT_VECTOR_ELT
INSERT_VECTOR_ELT(VECTOR, VAL, IDX) - Returns VECTOR with the element at IDX replaced with VAL.
Definition ISDOpcodes.h:560
@ TokenFactor
TokenFactor - This node takes multiple tokens as input and produces a single token result.
Definition ISDOpcodes.h:53
@ VECTOR_SPLICE
VECTOR_SPLICE(VEC1, VEC2, IMM) - Returns a subvector of the same type as VEC1/VEC2 from CONCAT_VECTOR...
Definition ISDOpcodes.h:656
@ ATOMIC_SWAP
Val, OUTCHAIN = ATOMIC_SWAP(INCHAIN, ptr, amt) Val, OUTCHAIN = ATOMIC_LOAD_[OpName](INCHAIN,...
@ ExternalSymbol
Definition ISDOpcodes.h:93
@ FFREXP
FFREXP - frexp, extract fractional and exponent component of a floating-point value.
@ FP_ROUND
X = FP_ROUND(Y, TRUNC) - Rounding 'Y' from a larger floating point type down to the precision of the ...
Definition ISDOpcodes.h:949
@ SPONENTRY
SPONENTRY - Represents the llvm.sponentry intrinsic.
Definition ISDOpcodes.h:122
@ CLEAR_CACHE
llvm.clear_cache intrinsic Operands: Input Chain, Start Addres, End Address Outputs: Output Chain
@ ADDRSPACECAST
ADDRSPACECAST - This operator converts between pointers of different address spaces.
Definition ISDOpcodes.h:987
@ EXPERIMENTAL_VECTOR_HISTOGRAM
Experimental vector histogram intrinsic Operands: Input Chain, Inc, Mask, Base, Index,...
@ STRICT_FNEARBYINT
Definition ISDOpcodes.h:453
@ FP_TO_SINT_SAT
FP_TO_[US]INT_SAT - Convert floating point value in operand 0 to a signed or unsigned scalar integer ...
Definition ISDOpcodes.h:935
@ VECREDUCE_FMINIMUM
@ EH_SJLJ_SETJMP
RESULT, OUTCHAIN = EH_SJLJ_SETJMP(INCHAIN, buffer) This corresponds to the eh.sjlj....
Definition ISDOpcodes.h:157
@ TRUNCATE
TRUNCATE - Completely drop the high bits.
Definition ISDOpcodes.h:846
@ VAARG
VAARG - VAARG has four operands: an input chain, a pointer, a SRCVALUE, and the alignment.
@ BRCOND
BRCOND - Conditional branch.
@ VECREDUCE_SEQ_FMUL
@ SHL_PARTS
SHL_PARTS/SRA_PARTS/SRL_PARTS - These operators are used for expanded integer shift operations.
Definition ISDOpcodes.h:823
@ AssertSext
AssertSext, AssertZext - These nodes record if a register contains a value that has already been zero...
Definition ISDOpcodes.h:62
@ FCOPYSIGN
FCOPYSIGN(X, Y) - Return the value of X with the sign of Y.
Definition ISDOpcodes.h:529
@ SADDSAT
RESULT = [US]ADDSAT(LHS, RHS) - Perform saturation addition on 2 integers with the same bit width (W)...
Definition ISDOpcodes.h:360
@ CALLSEQ_START
CALLSEQ_START/CALLSEQ_END - These operators mark the beginning and end of a call sequence,...
@ VECTOR_DEINTERLEAVE
VECTOR_DEINTERLEAVE(VEC1, VEC2, ...) - Returns N vectors from N input vectors, where N is the factor ...
Definition ISDOpcodes.h:619
@ GET_DYNAMIC_AREA_OFFSET
GET_DYNAMIC_AREA_OFFSET - get offset from native SP to the address of the most recent dynamic alloca.
@ SET_FPENV_MEM
Sets the current floating point environment.
@ FMINIMUMNUM
FMINIMUMNUM/FMAXIMUMNUM - minimumnum/maximumnum that is same with FMINNUM_IEEE and FMAXNUM_IEEE besid...
@ ABDS
ABDS/ABDU - Absolute difference - Return the absolute difference between two numbers interpreted as s...
Definition ISDOpcodes.h:721
@ ADJUST_TRAMPOLINE
ADJUST_TRAMPOLINE - This corresponds to the adjust_trampoline intrinsic.
@ INTRINSIC_W_CHAIN
RESULT,OUTCHAIN = INTRINSIC_W_CHAIN(INCHAIN, INTRINSICID, arg1, ...) This node represents a target in...
Definition ISDOpcodes.h:208
@ BUILD_VECTOR
BUILD_VECTOR(ELT0, ELT1, ELT2, ELT3,...) - Return a fixed-width vector with the specified,...
Definition ISDOpcodes.h:551
LLVM_ABI NodeType getExtForLoadExtType(bool IsFP, LoadExtType)
bool isNormalStore(const SDNode *N)
Returns true if the specified node is a non-truncating and unindexed store.
LLVM_ABI CondCode getSetCCInverse(CondCode Operation, EVT Type)
Return the operation corresponding to !(X op Y), where 'op' is a valid SetCC operation.
LLVM_ABI std::optional< unsigned > getVPMaskIdx(unsigned Opcode)
The operand position of the vector mask.
LLVM_ABI CondCode getSetCCSwappedOperands(CondCode Operation)
Return the operation corresponding to (Y op X) when given the operation for (X op Y).
bool isSignedIntSetCC(CondCode Code)
Return true if this is a setcc instruction that performs a signed comparison when used with integer o...
CondCode
ISD::CondCode enum - These are ordered carefully to make the bitfields below work out,...
LoadExtType
LoadExtType enum - This enum defines the three variants of LOADEXT (load with extension).
LLVM_ABI bool isVPOpcode(unsigned Opcode)
Whether this is a vector-predicated Opcode.
LLVM_ABI Libcall getPOWI(EVT RetVT)
getPOWI - Return the POWI_* value for the given types, or UNKNOWN_LIBCALL if there is none.
LLVM_ABI Libcall getSINTTOFP(EVT OpVT, EVT RetVT)
getSINTTOFP - Return the SINTTOFP_*_* value for the given types, or UNKNOWN_LIBCALL if there is none.
LLVM_ABI Libcall getSYNC(unsigned Opc, MVT VT)
Return the SYNC_FETCH_AND_* value for the given opcode and type, or UNKNOWN_LIBCALL if there is none.
LLVM_ABI Libcall getLDEXP(EVT RetVT)
getLDEXP - Return the LDEXP_* value for the given types, or UNKNOWN_LIBCALL if there is none.
LLVM_ABI Libcall getUINTTOFP(EVT OpVT, EVT RetVT)
getUINTTOFP - Return the UINTTOFP_*_* value for the given types, or UNKNOWN_LIBCALL if there is none.
LLVM_ABI Libcall getFREXP(EVT RetVT)
getFREXP - Return the FREXP_* value for the given types, or UNKNOWN_LIBCALL if there is none.
LLVM_ABI Libcall getSINCOSPI(EVT RetVT)
getSINCOSPI - Return the SINCOSPI_* value for the given types, or UNKNOWN_LIBCALL if there is none.
LLVM_ABI Libcall getFPLibCall(EVT VT, Libcall Call_F32, Libcall Call_F64, Libcall Call_F80, Libcall Call_F128, Libcall Call_PPCF128)
GetFPLibCall - Helper to return the right libcall for the given floating point type,...
LLVM_ABI Libcall getFPTOUINT(EVT OpVT, EVT RetVT)
getFPTOUINT - Return the FPTOUINT_*_* value for the given types, or UNKNOWN_LIBCALL if there is none.
LLVM_ABI Libcall getMODF(EVT VT)
getMODF - Return the MODF_* value for the given types, or UNKNOWN_LIBCALL if there is none.
LLVM_ABI Libcall getFPTOSINT(EVT OpVT, EVT RetVT)
getFPTOSINT - Return the FPTOSINT_*_* value for the given types, or UNKNOWN_LIBCALL if there is none.
LLVM_ABI Libcall getOUTLINE_ATOMIC(unsigned Opc, AtomicOrdering Order, MVT VT)
Return the outline atomics value for the given opcode, atomic ordering and type, or UNKNOWN_LIBCALL i...
LLVM_ABI Libcall getFPEXT(EVT OpVT, EVT RetVT)
getFPEXT - Return the FPEXT_*_* value for the given types, or UNKNOWN_LIBCALL if there is none.
LLVM_ABI Libcall getFPROUND(EVT OpVT, EVT RetVT)
getFPROUND - Return the FPROUND_*_* value for the given types, or UNKNOWN_LIBCALL if there is none.
LLVM_ABI Libcall getSINCOS_STRET(EVT RetVT)
Return the SINCOS_STRET_ value for the given types, or UNKNOWN_LIBCALL if there is none.
LLVM_ABI Libcall getSINCOS(EVT RetVT)
getSINCOS - Return the SINCOS_* value for the given types, or UNKNOWN_LIBCALL if there is none.
@ Undef
Value of the register doesn't matter.
std::enable_if_t< detail::IsValidPointer< X, Y >::value, X * > extract(Y &&MD)
Extract a Value from Metadata.
Definition Metadata.h:667
constexpr double e
NodeAddr< NodeBase * > Node
Definition RDFGraph.h:381
This is an optimization pass for GlobalISel generic memory operations.
auto drop_begin(T &&RangeOrContainer, size_t N=1)
Return a range covering RangeOrContainer with the first N elements excluded.
Definition STLExtras.h:316
void dump(const SparseBitVector< ElementSize > &LHS, raw_ostream &out)
unsigned Log2_32_Ceil(uint32_t Value)
Return the ceil log base 2 of the specified value, 32 if the value is zero.
Definition MathExtras.h:344
@ Offset
Definition DWP.cpp:532
FunctionAddr VTableAddr Value
Definition InstrProf.h:137
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:643
constexpr bool isPowerOf2_64(uint64_t Value)
Return true if the argument is a power of two > 0 (64 bit edition.)
Definition MathExtras.h:284
unsigned Log2_32(uint32_t Value)
Return the floor log base 2 of the specified value, -1 if the value is zero.
Definition MathExtras.h:331
constexpr bool isPowerOf2_32(uint32_t Value)
Return true if the argument is a power of two > 0.
Definition MathExtras.h:279
FPClassTest
Floating-point class tests, supported by 'is_fpclass' intrinsic.
APFloat scalbn(APFloat X, int Exp, APFloat::roundingMode RM)
Returns: X * 2^Exp for integral exponents.
Definition APFloat.h:1525
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
Definition Debug.cpp:207
LLVM_ABI Constant * ConstantFoldCastOperand(unsigned Opcode, Constant *C, Type *DestTy, const DataLayout &DL)
Attempt to constant fold a cast with the specified operand.
class LLVM_GSL_OWNER SmallVector
Forward declaration of SmallVector so that calculateSmallVectorDefaultInlinedElements can reference s...
bool isa(const From &Val)
isa<X> - Return true if the parameter to the template is an instance of one of the template type argu...
Definition Casting.h:547
AtomicOrdering
Atomic ordering for LLVM's memory model.
To bit_cast(const From &from) noexcept
Definition bit.h:90
@ Or
Bitwise or logical OR of integers.
@ And
Bitwise or logical AND of integers.
@ Sub
Subtraction of integers.
@ Add
Sum of integers.
DWARFExpression::Operation Op
ArrayRef(const T &OneElt) -> ArrayRef< T >
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:559
LLVM_ABI bool isOneConstant(SDValue V)
Returns true if V is a constant integer one.
Align commonAlignment(Align A, uint64_t Offset)
Returns the alignment that satisfies both alignments.
Definition Alignment.h:201
void swap(llvm::BitVector &LHS, llvm::BitVector &RHS)
Implement std::swap in terms of BitVector swap.
Definition BitVector.h:872
#define N
constexpr uint64_t value() const
This is a hole in the type system and should not be abused.
Definition Alignment.h:77
Extended Value Type.
Definition ValueTypes.h:35
TypeSize getStoreSize() const
Return the number of bytes overwritten by a store of the specified value type.
Definition ValueTypes.h:395
static EVT getVectorVT(LLVMContext &Context, EVT VT, unsigned NumElements, bool IsScalable=false)
Returns the EVT that represents a vector NumElements in length, where each element is of type VT.
Definition ValueTypes.h:74
EVT changeTypeToInteger() const
Return the type converted to an equivalently sized integer or vector with integer element type.
Definition ValueTypes.h:121
bool bitsGT(EVT VT) const
Return true if this has more bits than VT.
Definition ValueTypes.h:284
bool bitsLT(EVT VT) const
Return true if this has less bits than VT.
Definition ValueTypes.h:300
bool isFloatingPoint() const
Return true if this is a FP or a vector FP type.
Definition ValueTypes.h:147
TypeSize getSizeInBits() const
Return the size of the specified value type in bits.
Definition ValueTypes.h:373
bool isByteSized() const
Return true if the bit size is a multiple of 8.
Definition ValueTypes.h:243
uint64_t getScalarSizeInBits() const
Definition ValueTypes.h:385
EVT getHalfSizedIntegerVT(LLVMContext &Context) const
Finds the smallest simple value type that is greater than or equal to half the width of this EVT.
Definition ValueTypes.h:430
TypeSize getStoreSizeInBits() const
Return the number of bits overwritten by a store of the specified value type.
Definition ValueTypes.h:412
MVT getSimpleVT() const
Return the SimpleValueType held in the specified simple EVT.
Definition ValueTypes.h:316
static EVT getIntegerVT(LLVMContext &Context, unsigned BitWidth)
Returns the EVT that represents an integer with the given number of bits.
Definition ValueTypes.h:65
bool isVector() const
Return true if this is a vector value type.
Definition ValueTypes.h:168
EVT getScalarType() const
If this is a vector type, return the element type, otherwise return this.
Definition ValueTypes.h:323
bool bitsGE(EVT VT) const
Return true if this has no less bits than VT.
Definition ValueTypes.h:292
bool bitsEq(EVT VT) const
Return true if this has the same number of bits as VT.
Definition ValueTypes.h:256
LLVM_ABI Type * getTypeForEVT(LLVMContext &Context) const
This method returns an LLVM type corresponding to the specified EVT.
bool isScalableVector() const
Return true if this is a vector type where the runtime length is machine dependent.
Definition ValueTypes.h:174
EVT getVectorElementType() const
Given a vector type, return the type of each element.
Definition ValueTypes.h:328
bool isScalarInteger() const
Return true if this is an integer, but not a vector.
Definition ValueTypes.h:157
LLVM_ABI const fltSemantics & getFltSemantics() const
Returns an APFloat semantics tag appropriate for the value type.
unsigned getVectorNumElements() const
Given a vector type, return the number of elements it contains.
Definition ValueTypes.h:336
bool bitsLE(EVT VT) const
Return true if this has no more bits than VT.
Definition ValueTypes.h:308
bool isInteger() const
Return true if this is an integer or a vector integer type.
Definition ValueTypes.h:152
This class contains a discriminated union of information about pointers in memory operands,...
static LLVM_ABI MachinePointerInfo getJumpTable(MachineFunction &MF)
Return a MachinePointerInfo record that refers to a jump table entry.
static LLVM_ABI MachinePointerInfo getConstantPool(MachineFunction &MF)
Return a MachinePointerInfo record that refers to the constant pool.
MachinePointerInfo getWithOffset(int64_t O) const
static LLVM_ABI MachinePointerInfo getUnknownStack(MachineFunction &MF)
Stack memory without other information.
static LLVM_ABI MachinePointerInfo getFixedStack(MachineFunction &MF, int FI, int64_t Offset=0)
Return a MachinePointerInfo record that refers to the specified FrameIndex.
CallingConv::ID getLibcallImplCallingConv(RTLIB::LibcallImpl Call) const
Get the CallingConv that should be used for the specified libcall.
std::pair< FunctionType *, AttributeList > getFunctionTy(LLVMContext &Ctx, const Triple &TT, const DataLayout &DL, RTLIB::LibcallImpl LibcallImpl) const
These are IR-level optimization flags that may be propagated to SDNodes.
void setNoFPExcept(bool b)
void setNoUnsignedWrap(bool b)
void setNoSignedWrap(bool b)
MakeLibCallOptions & setIsSigned(bool Value=true)