LLVM 23.0.0git
LegalizeVectorOps.cpp
Go to the documentation of this file.
1//===- LegalizeVectorOps.cpp - Implement SelectionDAG::LegalizeVectors ----===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This file implements the SelectionDAG::LegalizeVectors method.
10//
11// The vector legalizer looks for vector operations which might need to be
12// scalarized and legalizes them. This is a separate step from Legalize because
13// scalarizing can introduce illegal types. For example, suppose we have an
14// ISD::SDIV of type v2i64 on x86-32. The type is legal (for example, addition
15// on a v2i64 is legal), but ISD::SDIV isn't legal, so we have to unroll the
16// operation, which introduces nodes with the illegal type i64 which must be
17// expanded. Similarly, suppose we have an ISD::SRA of type v16i8 on PowerPC;
18// the operation must be unrolled, which introduces nodes with the illegal
19// type i8 which must be promoted.
20//
21// This does not legalize vector manipulations like ISD::BUILD_VECTOR,
22// or operations that happen to take a vector which are custom-lowered;
23// the legalization for such operations never produces nodes
24// with illegal types, so it's okay to put off legalizing them until
25// SelectionDAG::Legalize runs.
26//
27//===----------------------------------------------------------------------===//
28
29#include "llvm/ADT/DenseMap.h"
39#include "llvm/IR/DataLayout.h"
42#include "llvm/Support/Debug.h"
44#include <cassert>
45#include <cstdint>
46#include <iterator>
47#include <utility>
48
49using namespace llvm;
50
51#define DEBUG_TYPE "legalizevectorops"
52
53namespace {
54
55class VectorLegalizer {
56 SelectionDAG& DAG;
57 const TargetLowering &TLI;
58 bool Changed = false; // Keep track of whether anything changed
59
60 /// For nodes that are of legal width, and that have more than one use, this
61 /// map indicates what regularized operand to use. This allows us to avoid
62 /// legalizing the same thing more than once.
64
65 /// Adds a node to the translation cache.
66 void AddLegalizedOperand(SDValue From, SDValue To) {
67 LegalizedNodes.insert(std::make_pair(From, To));
68 // If someone requests legalization of the new node, return itself.
69 if (From != To)
70 LegalizedNodes.insert(std::make_pair(To, To));
71 }
72
73 /// Legalizes the given node.
74 SDValue LegalizeOp(SDValue Op);
75
76 /// Assuming the node is legal, "legalize" the results.
77 SDValue TranslateLegalizeResults(SDValue Op, SDNode *Result);
78
79 /// Make sure Results are legal and update the translation cache.
80 SDValue RecursivelyLegalizeResults(SDValue Op,
82
83 /// Wrapper to interface LowerOperation with a vector of Results.
84 /// Returns false if the target wants to use default expansion. Otherwise
85 /// returns true. If return is true and the Results are empty, then the
86 /// target wants to keep the input node as is.
87 bool LowerOperationWrapper(SDNode *N, SmallVectorImpl<SDValue> &Results);
88
89 /// Implements unrolling a VSETCC.
90 SDValue UnrollVSETCC(SDNode *Node);
91
92 /// Implement expand-based legalization of vector operations.
93 ///
94 /// This is just a high-level routine to dispatch to specific code paths for
95 /// operations to legalize them.
97
98 /// Implements expansion for FP_TO_UINT; falls back to UnrollVectorOp if
99 /// FP_TO_SINT isn't legal.
100 void ExpandFP_TO_UINT(SDNode *Node, SmallVectorImpl<SDValue> &Results);
101
102 /// Implements expansion for UINT_TO_FLOAT; falls back to UnrollVectorOp if
103 /// SINT_TO_FLOAT and SHR on vectors isn't legal.
104 void ExpandUINT_TO_FLOAT(SDNode *Node, SmallVectorImpl<SDValue> &Results);
105
106 /// Implement expansion for SIGN_EXTEND_INREG using SRL and SRA.
107 SDValue ExpandSEXTINREG(SDNode *Node);
108
109 /// Implement expansion for ANY_EXTEND_VECTOR_INREG.
110 ///
111 /// Shuffles the low lanes of the operand into place and bitcasts to the proper
112 /// type. The contents of the bits in the extended part of each element are
113 /// undef.
114 SDValue ExpandANY_EXTEND_VECTOR_INREG(SDNode *Node);
115
116 /// Implement expansion for SIGN_EXTEND_VECTOR_INREG.
117 ///
118 /// Shuffles the low lanes of the operand into place, bitcasts to the proper
119 /// type, then shifts left and arithmetic shifts right to introduce a sign
120 /// extension.
121 SDValue ExpandSIGN_EXTEND_VECTOR_INREG(SDNode *Node);
122
123 /// Implement expansion for ZERO_EXTEND_VECTOR_INREG.
124 ///
125 /// Shuffles the low lanes of the operand into place and blends zeros into
126 /// the remaining lanes, finally bitcasting to the proper type.
127 SDValue ExpandZERO_EXTEND_VECTOR_INREG(SDNode *Node);
128
129 /// Expand bswap of vectors into a shuffle if legal.
130 SDValue ExpandBSWAP(SDNode *Node);
131
132 /// Implement vselect in terms of XOR, AND, OR when blend is not
133 /// supported by the target.
134 SDValue ExpandVSELECT(SDNode *Node);
135 SDValue ExpandVP_SELECT(SDNode *Node);
136 SDValue ExpandVP_MERGE(SDNode *Node);
137 SDValue ExpandVP_REM(SDNode *Node);
138 SDValue ExpandVP_FNEG(SDNode *Node);
139 SDValue ExpandVP_FABS(SDNode *Node);
140 SDValue ExpandVP_FCOPYSIGN(SDNode *Node);
141 SDValue ExpandLOOP_DEPENDENCE_MASK(SDNode *N);
142 SDValue ExpandMaskedBinOp(SDNode *N);
143 SDValue ExpandSELECT(SDNode *Node);
144 std::pair<SDValue, SDValue> ExpandLoad(SDNode *N);
145 SDValue ExpandStore(SDNode *N);
146 SDValue ExpandFNEG(SDNode *Node);
147 SDValue ExpandFABS(SDNode *Node);
148 SDValue ExpandFCOPYSIGN(SDNode *Node);
149 void ExpandFSUB(SDNode *Node, SmallVectorImpl<SDValue> &Results);
150 void ExpandSETCC(SDNode *Node, SmallVectorImpl<SDValue> &Results);
151 SDValue ExpandBITREVERSE(SDNode *Node);
152 void ExpandUADDSUBO(SDNode *Node, SmallVectorImpl<SDValue> &Results);
153 void ExpandSADDSUBO(SDNode *Node, SmallVectorImpl<SDValue> &Results);
154 void ExpandMULO(SDNode *Node, SmallVectorImpl<SDValue> &Results);
155 void ExpandFixedPointDiv(SDNode *Node, SmallVectorImpl<SDValue> &Results);
156 void ExpandStrictFPOp(SDNode *Node, SmallVectorImpl<SDValue> &Results);
157 void ExpandREM(SDNode *Node, SmallVectorImpl<SDValue> &Results);
158
159 bool tryExpandVecMathCall(SDNode *Node, RTLIB::Libcall LC,
161
162 void UnrollStrictFPOp(SDNode *Node, SmallVectorImpl<SDValue> &Results);
163
164 /// Implements vector promotion.
165 ///
166 /// This is essentially just bitcasting the operands to a different type and
167 /// bitcasting the result back to the original type.
169
170 /// Implements [SU]INT_TO_FP vector promotion.
171 ///
172 /// This is a [zs]ext of the input operand to a larger integer type.
173 void PromoteINT_TO_FP(SDNode *Node, SmallVectorImpl<SDValue> &Results);
174
175 /// Implements FP_TO_[SU]INT vector promotion of the result type.
176 ///
177 /// It is promoted to a larger integer type. The result is then
178 /// truncated back to the original type.
179 void PromoteFP_TO_INT(SDNode *Node, SmallVectorImpl<SDValue> &Results);
180
181 /// Implements vector setcc operation promotion.
182 ///
183 /// All vector operands are promoted to a vector type with larger element
184 /// type.
185 void PromoteSETCC(SDNode *Node, SmallVectorImpl<SDValue> &Results);
186
187 void PromoteSTRICT(SDNode *Node, SmallVectorImpl<SDValue> &Results);
188
189 /// Calculate the reduction using a type of higher precision and round the
190 /// result to match the original type. Setting NonArithmetic signifies the
191 /// rounding of the result does not affect its value.
192 void PromoteFloatVECREDUCE(SDNode *Node, SmallVectorImpl<SDValue> &Results,
193 bool NonArithmetic);
194
195 void PromoteVECTOR_COMPRESS(SDNode *Node, SmallVectorImpl<SDValue> &Results);
196
197public:
198 VectorLegalizer(SelectionDAG& dag) :
199 DAG(dag), TLI(dag.getTargetLoweringInfo()) {}
200
201 /// Begin legalizer the vector operations in the DAG.
202 bool Run();
203};
204
205} // end anonymous namespace
206
207bool VectorLegalizer::Run() {
208 // Before we start legalizing vector nodes, check if there are any vectors.
209 bool HasVectors = false;
211 E = std::prev(DAG.allnodes_end()); I != std::next(E); ++I) {
212 // Check if the values of the nodes contain vectors. We don't need to check
213 // the operands because we are going to check their values at some point.
214 HasVectors = llvm::any_of(I->values(), [](EVT T) { return T.isVector(); });
215
216 // If we found a vector node we can start the legalization.
217 if (HasVectors)
218 break;
219 }
220
221 // If this basic block has no vectors then no need to legalize vectors.
222 if (!HasVectors)
223 return false;
224
225 // The legalize process is inherently a bottom-up recursive process (users
226 // legalize their uses before themselves). Given infinite stack space, we
227 // could just start legalizing on the root and traverse the whole graph. In
228 // practice however, this causes us to run out of stack space on large basic
229 // blocks. To avoid this problem, compute an ordering of the nodes where each
230 // node is only legalized after all of its operands are legalized.
233 E = std::prev(DAG.allnodes_end()); I != std::next(E); ++I)
234 LegalizeOp(SDValue(&*I, 0));
235
236 // Finally, it's possible the root changed. Get the new root.
237 SDValue OldRoot = DAG.getRoot();
238 assert(LegalizedNodes.count(OldRoot) && "Root didn't get legalized?");
239 DAG.setRoot(LegalizedNodes[OldRoot]);
240
241 LegalizedNodes.clear();
242
243 // Remove dead nodes now.
244 DAG.RemoveDeadNodes();
245
246 return Changed;
247}
248
249SDValue VectorLegalizer::TranslateLegalizeResults(SDValue Op, SDNode *Result) {
250 assert(Op->getNumValues() == Result->getNumValues() &&
251 "Unexpected number of results");
252 // Generic legalization: just pass the operand through.
253 for (unsigned i = 0, e = Op->getNumValues(); i != e; ++i)
254 AddLegalizedOperand(Op.getValue(i), SDValue(Result, i));
255 return SDValue(Result, Op.getResNo());
256}
257
259VectorLegalizer::RecursivelyLegalizeResults(SDValue Op,
261 assert(Results.size() == Op->getNumValues() &&
262 "Unexpected number of results");
263 // Make sure that the generated code is itself legal.
264 for (unsigned i = 0, e = Results.size(); i != e; ++i) {
265 Results[i] = LegalizeOp(Results[i]);
266 AddLegalizedOperand(Op.getValue(i), Results[i]);
267 }
268
269 return Results[Op.getResNo()];
270}
271
272SDValue VectorLegalizer::LegalizeOp(SDValue Op) {
273 // Note that LegalizeOp may be reentered even from single-use nodes, which
274 // means that we always must cache transformed nodes.
275 auto I = LegalizedNodes.find(Op);
276 if (I != LegalizedNodes.end()) return I->second;
277
278 // Legalize the operands
280 for (const SDValue &Oper : Op->op_values())
281 Ops.push_back(LegalizeOp(Oper));
282
283 SDNode *Node = DAG.UpdateNodeOperands(Op.getNode(), Ops);
284
285 bool HasVectorValueOrOp =
286 llvm::any_of(Node->values(), [](EVT T) { return T.isVector(); }) ||
287 llvm::any_of(Node->op_values(),
288 [](SDValue O) { return O.getValueType().isVector(); });
289 if (!HasVectorValueOrOp)
290 return TranslateLegalizeResults(Op, Node);
291
292 TargetLowering::LegalizeAction Action = TargetLowering::Legal;
293 EVT ValVT;
294 switch (Op.getOpcode()) {
295 default:
296 return TranslateLegalizeResults(Op, Node);
297 case ISD::LOAD: {
298 LoadSDNode *LD = cast<LoadSDNode>(Node);
299 ISD::LoadExtType ExtType = LD->getExtensionType();
300 EVT LoadedVT = LD->getMemoryVT();
301 if (LoadedVT.isVector() && ExtType != ISD::NON_EXTLOAD)
302 Action = TLI.getLoadAction(LD->getValueType(0), LoadedVT, LD->getAlign(),
303 LD->getAddressSpace(), ExtType, false);
304 break;
305 }
306 case ISD::STORE: {
307 StoreSDNode *ST = cast<StoreSDNode>(Node);
308 EVT StVT = ST->getMemoryVT();
309 MVT ValVT = ST->getValue().getSimpleValueType();
310 if (StVT.isVector() && ST->isTruncatingStore())
311 Action = TLI.getTruncStoreAction(ValVT, StVT, ST->getAlign(),
312 ST->getAddressSpace());
313 break;
314 }
316 Action = TLI.getOperationAction(Node->getOpcode(), Node->getValueType(0));
317 // This operation lies about being legal: when it claims to be legal,
318 // it should actually be expanded.
319 if (Action == TargetLowering::Legal)
320 Action = TargetLowering::Expand;
321 break;
322#define DAG_INSTRUCTION(NAME, NARG, ROUND_MODE, INTRINSIC, DAGN) \
323 case ISD::STRICT_##DAGN:
324#include "llvm/IR/ConstrainedOps.def"
325 ValVT = Node->getValueType(0);
326 if (Op.getOpcode() == ISD::STRICT_SINT_TO_FP ||
327 Op.getOpcode() == ISD::STRICT_UINT_TO_FP)
328 ValVT = Node->getOperand(1).getValueType();
329 if (Op.getOpcode() == ISD::STRICT_FSETCC ||
330 Op.getOpcode() == ISD::STRICT_FSETCCS) {
331 MVT OpVT = Node->getOperand(1).getSimpleValueType();
332 ISD::CondCode CCCode = cast<CondCodeSDNode>(Node->getOperand(3))->get();
333 Action = TLI.getCondCodeAction(CCCode, OpVT);
334 if (Action == TargetLowering::Legal)
335 Action = TLI.getOperationAction(Node->getOpcode(), OpVT);
336 } else {
337 Action = TLI.getOperationAction(Node->getOpcode(), ValVT);
338 }
339 // If we're asked to expand a strict vector floating-point operation,
340 // by default we're going to simply unroll it. That is usually the
341 // best approach, except in the case where the resulting strict (scalar)
342 // operations would themselves use the fallback mutation to non-strict.
343 // In that specific case, just do the fallback on the vector op.
344 if (Action == TargetLowering::Expand && !TLI.isStrictFPEnabled() &&
345 TLI.getStrictFPOperationAction(Node->getOpcode(), ValVT) ==
346 TargetLowering::Legal) {
347 EVT EltVT = ValVT.getVectorElementType();
348 if (TLI.getOperationAction(Node->getOpcode(), EltVT)
349 == TargetLowering::Expand &&
350 TLI.getStrictFPOperationAction(Node->getOpcode(), EltVT)
351 == TargetLowering::Legal)
352 Action = TargetLowering::Legal;
353 }
354 break;
355 case ISD::ADD:
356 case ISD::SUB:
357 case ISD::MUL:
358 case ISD::MULHS:
359 case ISD::MULHU:
360 case ISD::SDIV:
361 case ISD::UDIV:
362 case ISD::SREM:
363 case ISD::UREM:
364 case ISD::SDIVREM:
365 case ISD::UDIVREM:
366 case ISD::FADD:
367 case ISD::FSUB:
368 case ISD::FMUL:
369 case ISD::FDIV:
370 case ISD::FREM:
371 case ISD::AND:
372 case ISD::OR:
373 case ISD::XOR:
374 case ISD::SHL:
375 case ISD::SRA:
376 case ISD::SRL:
377 case ISD::FSHL:
378 case ISD::FSHR:
379 case ISD::ROTL:
380 case ISD::ROTR:
381 case ISD::ABS:
383 case ISD::ABDS:
384 case ISD::ABDU:
385 case ISD::AVGCEILS:
386 case ISD::AVGCEILU:
387 case ISD::AVGFLOORS:
388 case ISD::AVGFLOORU:
389 case ISD::BSWAP:
390 case ISD::BITREVERSE:
391 case ISD::CTLZ:
392 case ISD::CTTZ:
395 case ISD::CTPOP:
396 case ISD::CLMUL:
397 case ISD::CLMULH:
398 case ISD::CLMULR:
399 case ISD::SELECT:
400 case ISD::VSELECT:
401 case ISD::SELECT_CC:
402 case ISD::ZERO_EXTEND:
403 case ISD::ANY_EXTEND:
404 case ISD::TRUNCATE:
405 case ISD::SIGN_EXTEND:
406 case ISD::FP_TO_SINT:
407 case ISD::FP_TO_UINT:
408 case ISD::FNEG:
409 case ISD::FABS:
410 case ISD::FMINNUM:
411 case ISD::FMAXNUM:
414 case ISD::FMINIMUM:
415 case ISD::FMAXIMUM:
416 case ISD::FMINIMUMNUM:
417 case ISD::FMAXIMUMNUM:
418 case ISD::FCOPYSIGN:
419 case ISD::FSQRT:
420 case ISD::FSIN:
421 case ISD::FCOS:
422 case ISD::FTAN:
423 case ISD::FASIN:
424 case ISD::FACOS:
425 case ISD::FATAN:
426 case ISD::FATAN2:
427 case ISD::FSINH:
428 case ISD::FCOSH:
429 case ISD::FTANH:
430 case ISD::FLDEXP:
431 case ISD::FPOWI:
432 case ISD::FPOW:
433 case ISD::FCBRT:
434 case ISD::FLOG:
435 case ISD::FLOG2:
436 case ISD::FLOG10:
437 case ISD::FEXP:
438 case ISD::FEXP2:
439 case ISD::FEXP10:
440 case ISD::FCEIL:
441 case ISD::FTRUNC:
442 case ISD::FRINT:
443 case ISD::FNEARBYINT:
444 case ISD::FROUND:
445 case ISD::FROUNDEVEN:
446 case ISD::FFLOOR:
447 case ISD::FP_ROUND:
448 case ISD::FP_EXTEND:
450 case ISD::FMA:
455 case ISD::SMIN:
456 case ISD::SMAX:
457 case ISD::UMIN:
458 case ISD::UMAX:
459 case ISD::SMUL_LOHI:
460 case ISD::UMUL_LOHI:
461 case ISD::SADDO:
462 case ISD::UADDO:
463 case ISD::SSUBO:
464 case ISD::USUBO:
465 case ISD::SMULO:
466 case ISD::UMULO:
469 case ISD::FFREXP:
470 case ISD::FMODF:
471 case ISD::FSINCOS:
472 case ISD::FSINCOSPI:
473 case ISD::SADDSAT:
474 case ISD::UADDSAT:
475 case ISD::SSUBSAT:
476 case ISD::USUBSAT:
477 case ISD::SSHLSAT:
478 case ISD::USHLSAT:
481 case ISD::MGATHER:
483 case ISD::SCMP:
484 case ISD::UCMP:
487 case ISD::MASKED_UDIV:
488 case ISD::MASKED_SDIV:
489 case ISD::MASKED_UREM:
490 case ISD::MASKED_SREM:
491 Action = TLI.getOperationAction(Node->getOpcode(), Node->getValueType(0));
492 break;
493 case ISD::SMULFIX:
494 case ISD::SMULFIXSAT:
495 case ISD::UMULFIX:
496 case ISD::UMULFIXSAT:
497 case ISD::SDIVFIX:
498 case ISD::SDIVFIXSAT:
499 case ISD::UDIVFIX:
500 case ISD::UDIVFIXSAT: {
501 unsigned Scale = Node->getConstantOperandVal(2);
502 Action = TLI.getFixedPointOperationAction(Node->getOpcode(),
503 Node->getValueType(0), Scale);
504 break;
505 }
506 case ISD::LROUND:
507 case ISD::LLROUND:
508 case ISD::LRINT:
509 case ISD::LLRINT:
510 case ISD::SINT_TO_FP:
511 case ISD::UINT_TO_FP:
527 case ISD::CTTZ_ELTS:
530 Action = TLI.getOperationAction(Node->getOpcode(),
531 Node->getOperand(0).getValueType());
532 break;
535 Action = TLI.getOperationAction(Node->getOpcode(),
536 Node->getOperand(1).getValueType());
537 break;
538 case ISD::SETCC: {
539 MVT OpVT = Node->getOperand(0).getSimpleValueType();
540 ISD::CondCode CCCode = cast<CondCodeSDNode>(Node->getOperand(2))->get();
541 Action = TLI.getCondCodeAction(CCCode, OpVT);
542 if (Action == TargetLowering::Legal)
543 Action = TLI.getOperationAction(Node->getOpcode(), OpVT);
544 break;
545 }
550 Action =
551 TLI.getPartialReduceMLAAction(Op.getOpcode(), Node->getValueType(0),
552 Node->getOperand(1).getValueType());
553 break;
554
555#define BEGIN_REGISTER_VP_SDNODE(VPID, LEGALPOS, ...) \
556 case ISD::VPID: { \
557 EVT LegalizeVT = LEGALPOS < 0 ? Node->getValueType(-(1 + LEGALPOS)) \
558 : Node->getOperand(LEGALPOS).getValueType(); \
559 if (ISD::VPID == ISD::VP_SETCC) { \
560 ISD::CondCode CCCode = cast<CondCodeSDNode>(Node->getOperand(2))->get(); \
561 Action = TLI.getCondCodeAction(CCCode, LegalizeVT.getSimpleVT()); \
562 if (Action != TargetLowering::Legal) \
563 break; \
564 } \
565 /* Defer non-vector results to LegalizeDAG. */ \
566 if (!Node->getValueType(0).isVector() && \
567 Node->getValueType(0) != MVT::Other) { \
568 Action = TargetLowering::Legal; \
569 break; \
570 } \
571 Action = TLI.getOperationAction(Node->getOpcode(), LegalizeVT); \
572 } break;
573#include "llvm/IR/VPIntrinsics.def"
574 }
575
576 LLVM_DEBUG(dbgs() << "\nLegalizing vector op: "; Node->dump(&DAG));
577
578 SmallVector<SDValue, 8> ResultVals;
579 switch (Action) {
580 default: llvm_unreachable("This action is not supported yet!");
581 case TargetLowering::Promote:
582 assert((Op.getOpcode() != ISD::LOAD && Op.getOpcode() != ISD::STORE) &&
583 "This action is not supported yet!");
584 LLVM_DEBUG(dbgs() << "Promoting\n");
585 Promote(Node, ResultVals);
586 assert(!ResultVals.empty() && "No results for promotion?");
587 break;
588 case TargetLowering::Legal:
589 LLVM_DEBUG(dbgs() << "Legal node: nothing to do\n");
590 break;
591 case TargetLowering::Custom:
592 LLVM_DEBUG(dbgs() << "Trying custom legalization\n");
593 if (LowerOperationWrapper(Node, ResultVals))
594 break;
595 LLVM_DEBUG(dbgs() << "Could not custom legalize node\n");
596 [[fallthrough]];
597 case TargetLowering::Expand:
598 LLVM_DEBUG(dbgs() << "Expanding\n");
599 Expand(Node, ResultVals);
600 break;
601 }
602
603 if (ResultVals.empty())
604 return TranslateLegalizeResults(Op, Node);
605
606 Changed = true;
607 return RecursivelyLegalizeResults(Op, ResultVals);
608}
609
610// FIXME: This is very similar to TargetLowering::LowerOperationWrapper. Can we
611// merge them somehow?
612bool VectorLegalizer::LowerOperationWrapper(SDNode *Node,
613 SmallVectorImpl<SDValue> &Results) {
614 SDValue Res = TLI.LowerOperation(SDValue(Node, 0), DAG);
615
616 if (!Res.getNode())
617 return false;
618
619 if (Res == SDValue(Node, 0))
620 return true;
621
622 // If the original node has one result, take the return value from
623 // LowerOperation as is. It might not be result number 0.
624 if (Node->getNumValues() == 1) {
625 Results.push_back(Res);
626 return true;
627 }
628
629 // If the original node has multiple results, then the return node should
630 // have the same number of results.
631 assert((Node->getNumValues() == Res->getNumValues()) &&
632 "Lowering returned the wrong number of results!");
633
634 // Places new result values base on N result number.
635 for (unsigned I = 0, E = Node->getNumValues(); I != E; ++I)
636 Results.push_back(Res.getValue(I));
637
638 return true;
639}
640
641void VectorLegalizer::PromoteSETCC(SDNode *Node,
642 SmallVectorImpl<SDValue> &Results) {
643 MVT VecVT = Node->getOperand(0).getSimpleValueType();
644 MVT NewVecVT = TLI.getTypeToPromoteTo(Node->getOpcode(), VecVT);
645
646 unsigned ExtOp = VecVT.isFloatingPoint() ? ISD::FP_EXTEND : ISD::ANY_EXTEND;
647
648 SDLoc DL(Node);
649 SmallVector<SDValue, 5> Operands(Node->getNumOperands());
650
651 Operands[0] = DAG.getNode(ExtOp, DL, NewVecVT, Node->getOperand(0));
652 Operands[1] = DAG.getNode(ExtOp, DL, NewVecVT, Node->getOperand(1));
653 Operands[2] = Node->getOperand(2);
654
655 if (Node->getOpcode() == ISD::VP_SETCC) {
656 Operands[3] = Node->getOperand(3); // mask
657 Operands[4] = Node->getOperand(4); // evl
658 }
659
660 SDValue Res = DAG.getNode(Node->getOpcode(), DL, Node->getSimpleValueType(0),
661 Operands, Node->getFlags());
662
663 Results.push_back(Res);
664}
665
666void VectorLegalizer::PromoteSTRICT(SDNode *Node,
667 SmallVectorImpl<SDValue> &Results) {
668 MVT VecVT = Node->getOperand(1).getSimpleValueType();
669 MVT NewVecVT = TLI.getTypeToPromoteTo(Node->getOpcode(), VecVT);
670
671 assert(VecVT.isFloatingPoint());
672
673 SDLoc DL(Node);
674 SmallVector<SDValue, 5> Operands(Node->getNumOperands());
676
677 for (unsigned j = 1; j != Node->getNumOperands(); ++j)
678 if (Node->getOperand(j).getValueType().isVector() &&
679 !(ISD::isVPOpcode(Node->getOpcode()) &&
680 ISD::getVPMaskIdx(Node->getOpcode()) == j)) // Skip mask operand.
681 {
682 // promote the vector operand.
683 SDValue Ext =
684 DAG.getNode(ISD::STRICT_FP_EXTEND, DL, {NewVecVT, MVT::Other},
685 {Node->getOperand(0), Node->getOperand(j)});
686 Operands[j] = Ext.getValue(0);
687 Chains.push_back(Ext.getValue(1));
688 } else
689 Operands[j] = Node->getOperand(j); // Skip no vector operand.
690
691 SDVTList VTs = DAG.getVTList(NewVecVT, Node->getValueType(1));
692
693 Operands[0] = DAG.getNode(ISD::TokenFactor, DL, MVT::Other, Chains);
694
695 SDValue Res =
696 DAG.getNode(Node->getOpcode(), DL, VTs, Operands, Node->getFlags());
697
698 SDValue Round =
699 DAG.getNode(ISD::STRICT_FP_ROUND, DL, {VecVT, MVT::Other},
700 {Res.getValue(1), Res.getValue(0),
701 DAG.getIntPtrConstant(0, DL, /*isTarget=*/true)});
702
703 Results.push_back(Round.getValue(0));
704 Results.push_back(Round.getValue(1));
705}
706
707void VectorLegalizer::PromoteFloatVECREDUCE(SDNode *Node,
708 SmallVectorImpl<SDValue> &Results,
709 bool NonArithmetic) {
710 MVT OpVT = Node->getOperand(0).getSimpleValueType();
711 assert(OpVT.isFloatingPoint() && "Expected floating point reduction!");
712 MVT NewOpVT = TLI.getTypeToPromoteTo(Node->getOpcode(), OpVT);
713
714 SDLoc DL(Node);
715 SDValue NewOp = DAG.getNode(ISD::FP_EXTEND, DL, NewOpVT, Node->getOperand(0));
716 SDValue Rdx =
717 DAG.getNode(Node->getOpcode(), DL, NewOpVT.getVectorElementType(), NewOp,
718 Node->getFlags());
719 SDValue Res =
720 DAG.getNode(ISD::FP_ROUND, DL, Node->getValueType(0), Rdx,
721 DAG.getIntPtrConstant(NonArithmetic, DL, /*isTarget=*/true));
722 Results.push_back(Res);
723}
724
725void VectorLegalizer::PromoteVECTOR_COMPRESS(
726 SDNode *Node, SmallVectorImpl<SDValue> &Results) {
727 SDLoc DL(Node);
728 EVT VT = Node->getValueType(0);
729 MVT PromotedVT = TLI.getTypeToPromoteTo(Node->getOpcode(), VT.getSimpleVT());
730 assert((VT.isInteger() || VT.getSizeInBits() == PromotedVT.getSizeInBits()) &&
731 "Only integer promotion or bitcasts between types is supported");
732
733 SDValue Vec = Node->getOperand(0);
734 SDValue Mask = Node->getOperand(1);
735 SDValue Passthru = Node->getOperand(2);
736 if (VT.isInteger()) {
737 Vec = DAG.getNode(ISD::ANY_EXTEND, DL, PromotedVT, Vec);
738 Mask = TLI.promoteTargetBoolean(DAG, Mask, PromotedVT);
739 Passthru = DAG.getNode(ISD::ANY_EXTEND, DL, PromotedVT, Passthru);
740 } else {
741 Vec = DAG.getBitcast(PromotedVT, Vec);
742 Passthru = DAG.getBitcast(PromotedVT, Passthru);
743 }
744
746 DAG.getNode(ISD::VECTOR_COMPRESS, DL, PromotedVT, Vec, Mask, Passthru);
747 Result = VT.isInteger() ? DAG.getNode(ISD::TRUNCATE, DL, VT, Result)
748 : DAG.getBitcast(VT, Result);
749 Results.push_back(Result);
750}
751
752void VectorLegalizer::Promote(SDNode *Node, SmallVectorImpl<SDValue> &Results) {
753 // For a few operations there is a specific concept for promotion based on
754 // the operand's type.
755 switch (Node->getOpcode()) {
756 case ISD::SINT_TO_FP:
757 case ISD::UINT_TO_FP:
760 // "Promote" the operation by extending the operand.
761 PromoteINT_TO_FP(Node, Results);
762 return;
763 case ISD::FP_TO_UINT:
764 case ISD::FP_TO_SINT:
767 // Promote the operation by extending the operand.
768 PromoteFP_TO_INT(Node, Results);
769 return;
770 case ISD::VP_SETCC:
771 case ISD::SETCC:
772 // Promote the operation by extending the operand.
773 PromoteSETCC(Node, Results);
774 return;
775 case ISD::STRICT_FADD:
776 case ISD::STRICT_FSUB:
777 case ISD::STRICT_FMUL:
778 case ISD::STRICT_FDIV:
780 case ISD::STRICT_FMA:
781 PromoteSTRICT(Node, Results);
782 return;
785 PromoteFloatVECREDUCE(Node, Results, /*NonArithmetic=*/false);
786 return;
791 PromoteFloatVECREDUCE(Node, Results, /*NonArithmetic=*/true);
792 return;
794 PromoteVECTOR_COMPRESS(Node, Results);
795 return;
796
797 case ISD::FP_ROUND:
798 case ISD::FP_EXTEND:
799 // These operations are used to do promotion so they can't be promoted
800 // themselves.
801 llvm_unreachable("Don't know how to promote this operation!");
802 case ISD::VP_FABS:
803 case ISD::VP_FCOPYSIGN:
804 case ISD::VP_FNEG:
805 // Promoting fabs, fneg, and fcopysign changes their semantics.
806 llvm_unreachable("These operations should not be promoted");
807 }
808
809 // There are currently two cases of vector promotion:
810 // 1) Bitcasting a vector of integers to a different type to a vector of the
811 // same overall length. For example, x86 promotes ISD::AND v2i32 to v1i64.
812 // 2) Extending a vector of floats to a vector of the same number of larger
813 // floats. For example, AArch64 promotes ISD::FADD on v4f16 to v4f32.
814 assert(Node->getNumValues() == 1 &&
815 "Can't promote a vector with multiple results!");
816 MVT VT = Node->getSimpleValueType(0);
817 MVT NVT = TLI.getTypeToPromoteTo(Node->getOpcode(), VT);
818 SDLoc dl(Node);
819 SmallVector<SDValue, 4> Operands(Node->getNumOperands());
820
821 for (unsigned j = 0; j != Node->getNumOperands(); ++j) {
822 // Do not promote the mask operand of a VP OP.
823 bool SkipPromote = ISD::isVPOpcode(Node->getOpcode()) &&
824 ISD::getVPMaskIdx(Node->getOpcode()) == j;
825 if (Node->getOperand(j).getValueType().isVector() && !SkipPromote)
826 if (Node->getOperand(j)
827 .getValueType()
828 .getVectorElementType()
829 .isFloatingPoint() &&
831 if (ISD::isVPOpcode(Node->getOpcode())) {
832 unsigned EVLIdx =
834 unsigned MaskIdx = *ISD::getVPMaskIdx(Node->getOpcode());
835 Operands[j] =
836 DAG.getNode(ISD::VP_FP_EXTEND, dl, NVT, Node->getOperand(j),
837 Node->getOperand(MaskIdx), Node->getOperand(EVLIdx));
838 } else {
839 Operands[j] =
840 DAG.getNode(ISD::FP_EXTEND, dl, NVT, Node->getOperand(j));
841 }
842 else
843 Operands[j] = DAG.getNode(ISD::BITCAST, dl, NVT, Node->getOperand(j));
844 else
845 Operands[j] = Node->getOperand(j);
846 }
847
848 SDValue Res =
849 DAG.getNode(Node->getOpcode(), dl, NVT, Operands, Node->getFlags());
850
851 if ((VT.isFloatingPoint() && NVT.isFloatingPoint()) ||
854 if (ISD::isVPOpcode(Node->getOpcode())) {
855 unsigned EVLIdx = *ISD::getVPExplicitVectorLengthIdx(Node->getOpcode());
856 unsigned MaskIdx = *ISD::getVPMaskIdx(Node->getOpcode());
857 Res = DAG.getNode(ISD::VP_FP_ROUND, dl, VT, Res,
858 Node->getOperand(MaskIdx), Node->getOperand(EVLIdx));
859 } else {
860 Res = DAG.getNode(ISD::FP_ROUND, dl, VT, Res,
861 DAG.getIntPtrConstant(0, dl, /*isTarget=*/true));
862 }
863 else
864 Res = DAG.getNode(ISD::BITCAST, dl, VT, Res);
865
866 Results.push_back(Res);
867}
868
869void VectorLegalizer::PromoteINT_TO_FP(SDNode *Node,
870 SmallVectorImpl<SDValue> &Results) {
871 // INT_TO_FP operations may require the input operand be promoted even
872 // when the type is otherwise legal.
873 bool IsStrict = Node->isStrictFPOpcode();
874 MVT VT = Node->getOperand(IsStrict ? 1 : 0).getSimpleValueType();
875 MVT NVT = TLI.getTypeToPromoteTo(Node->getOpcode(), VT);
877 "Vectors have different number of elements!");
878
879 SDLoc dl(Node);
880 SmallVector<SDValue, 4> Operands(Node->getNumOperands());
881
882 unsigned Opc = (Node->getOpcode() == ISD::UINT_TO_FP ||
883 Node->getOpcode() == ISD::STRICT_UINT_TO_FP)
886 for (unsigned j = 0; j != Node->getNumOperands(); ++j) {
887 if (Node->getOperand(j).getValueType().isVector())
888 Operands[j] = DAG.getNode(Opc, dl, NVT, Node->getOperand(j));
889 else
890 Operands[j] = Node->getOperand(j);
891 }
892
893 if (IsStrict) {
894 SDValue Res = DAG.getNode(Node->getOpcode(), dl,
895 {Node->getValueType(0), MVT::Other}, Operands);
896 Results.push_back(Res);
897 Results.push_back(Res.getValue(1));
898 return;
899 }
900
901 SDValue Res =
902 DAG.getNode(Node->getOpcode(), dl, Node->getValueType(0), Operands);
903 Results.push_back(Res);
904}
905
906// For FP_TO_INT we promote the result type to a vector type with wider
907// elements and then truncate the result. This is different from the default
908// PromoteVector which uses bitcast to promote thus assumning that the
909// promoted vector type has the same overall size.
910void VectorLegalizer::PromoteFP_TO_INT(SDNode *Node,
911 SmallVectorImpl<SDValue> &Results) {
912 MVT VT = Node->getSimpleValueType(0);
913 MVT NVT = TLI.getTypeToPromoteTo(Node->getOpcode(), VT);
914 bool IsStrict = Node->isStrictFPOpcode();
916 "Vectors have different number of elements!");
917
918 unsigned NewOpc = Node->getOpcode();
919 // Change FP_TO_UINT to FP_TO_SINT if possible.
920 // TODO: Should we only do this if FP_TO_UINT itself isn't legal?
921 if (NewOpc == ISD::FP_TO_UINT &&
923 NewOpc = ISD::FP_TO_SINT;
924
925 if (NewOpc == ISD::STRICT_FP_TO_UINT &&
927 NewOpc = ISD::STRICT_FP_TO_SINT;
928
929 SDLoc dl(Node);
930 SDValue Promoted, Chain;
931 if (IsStrict) {
932 Promoted = DAG.getNode(NewOpc, dl, {NVT, MVT::Other},
933 {Node->getOperand(0), Node->getOperand(1)});
934 Chain = Promoted.getValue(1);
935 } else
936 Promoted = DAG.getNode(NewOpc, dl, NVT, Node->getOperand(0));
937
938 // Assert that the converted value fits in the original type. If it doesn't
939 // (eg: because the value being converted is too big), then the result of the
940 // original operation was undefined anyway, so the assert is still correct.
941 if (Node->getOpcode() == ISD::FP_TO_UINT ||
942 Node->getOpcode() == ISD::STRICT_FP_TO_UINT)
943 NewOpc = ISD::AssertZext;
944 else
945 NewOpc = ISD::AssertSext;
946
947 Promoted = DAG.getNode(NewOpc, dl, NVT, Promoted,
948 DAG.getValueType(VT.getScalarType()));
949 Promoted = DAG.getNode(ISD::TRUNCATE, dl, VT, Promoted);
950 Results.push_back(Promoted);
951 if (IsStrict)
952 Results.push_back(Chain);
953}
954
955std::pair<SDValue, SDValue> VectorLegalizer::ExpandLoad(SDNode *N) {
956 LoadSDNode *LD = cast<LoadSDNode>(N);
957 return TLI.scalarizeVectorLoad(LD, DAG);
958}
959
960SDValue VectorLegalizer::ExpandStore(SDNode *N) {
961 StoreSDNode *ST = cast<StoreSDNode>(N);
962 SDValue TF = TLI.scalarizeVectorStore(ST, DAG);
963 return TF;
964}
965
966void VectorLegalizer::Expand(SDNode *Node, SmallVectorImpl<SDValue> &Results) {
967 switch (Node->getOpcode()) {
968 case ISD::LOAD: {
969 std::pair<SDValue, SDValue> Tmp = ExpandLoad(Node);
970 Results.push_back(Tmp.first);
971 Results.push_back(Tmp.second);
972 return;
973 }
974 case ISD::STORE:
975 Results.push_back(ExpandStore(Node));
976 return;
978 for (unsigned i = 0, e = Node->getNumValues(); i != e; ++i)
979 Results.push_back(Node->getOperand(i));
980 return;
982 if (SDValue Expanded = ExpandSEXTINREG(Node)) {
983 Results.push_back(Expanded);
984 return;
985 }
986 break;
988 Results.push_back(ExpandANY_EXTEND_VECTOR_INREG(Node));
989 return;
991 Results.push_back(ExpandSIGN_EXTEND_VECTOR_INREG(Node));
992 return;
994 Results.push_back(ExpandZERO_EXTEND_VECTOR_INREG(Node));
995 return;
996 case ISD::BSWAP:
997 if (SDValue Expanded = ExpandBSWAP(Node)) {
998 Results.push_back(Expanded);
999 return;
1000 }
1001 break;
1002 case ISD::VP_BSWAP:
1003 Results.push_back(TLI.expandVPBSWAP(Node, DAG));
1004 return;
1005 case ISD::VSELECT:
1006 if (SDValue Expanded = ExpandVSELECT(Node)) {
1007 Results.push_back(Expanded);
1008 return;
1009 }
1010 break;
1011 case ISD::VP_SELECT:
1012 if (SDValue Expanded = ExpandVP_SELECT(Node)) {
1013 Results.push_back(Expanded);
1014 return;
1015 }
1016 break;
1017 case ISD::VP_SREM:
1018 case ISD::VP_UREM:
1019 if (SDValue Expanded = ExpandVP_REM(Node)) {
1020 Results.push_back(Expanded);
1021 return;
1022 }
1023 break;
1024 case ISD::VP_FNEG:
1025 if (SDValue Expanded = ExpandVP_FNEG(Node)) {
1026 Results.push_back(Expanded);
1027 return;
1028 }
1029 break;
1030 case ISD::VP_FABS:
1031 if (SDValue Expanded = ExpandVP_FABS(Node)) {
1032 Results.push_back(Expanded);
1033 return;
1034 }
1035 break;
1036 case ISD::VP_FCOPYSIGN:
1037 if (SDValue Expanded = ExpandVP_FCOPYSIGN(Node)) {
1038 Results.push_back(Expanded);
1039 return;
1040 }
1041 break;
1042 case ISD::SELECT:
1043 if (SDValue Expanded = ExpandSELECT(Node)) {
1044 Results.push_back(Expanded);
1045 return;
1046 }
1047 break;
1048 case ISD::SELECT_CC: {
1049 if (Node->getValueType(0).isScalableVector()) {
1050 EVT CondVT = TLI.getSetCCResultType(
1051 DAG.getDataLayout(), *DAG.getContext(), Node->getValueType(0));
1052 SDValue SetCC =
1053 DAG.getNode(ISD::SETCC, SDLoc(Node), CondVT, Node->getOperand(0),
1054 Node->getOperand(1), Node->getOperand(4));
1055 Results.push_back(DAG.getSelect(SDLoc(Node), Node->getValueType(0), SetCC,
1056 Node->getOperand(2),
1057 Node->getOperand(3)));
1058 return;
1059 }
1060 break;
1061 }
1062 case ISD::FP_TO_UINT:
1063 ExpandFP_TO_UINT(Node, Results);
1064 return;
1065 case ISD::UINT_TO_FP:
1066 ExpandUINT_TO_FLOAT(Node, Results);
1067 return;
1068 case ISD::FNEG:
1069 if (SDValue Expanded = ExpandFNEG(Node)) {
1070 Results.push_back(Expanded);
1071 return;
1072 }
1073 break;
1074 case ISD::FABS:
1075 if (SDValue Expanded = ExpandFABS(Node)) {
1076 Results.push_back(Expanded);
1077 return;
1078 }
1079 break;
1080 case ISD::FCOPYSIGN:
1081 if (SDValue Expanded = ExpandFCOPYSIGN(Node)) {
1082 Results.push_back(Expanded);
1083 return;
1084 }
1085 break;
1086 case ISD::FCANONICALIZE: {
1087 // If the scalar element type has a
1088 // Legal/Custom FCANONICALIZE, don't
1089 // mess with the vector, fall back.
1090 EVT VT = Node->getValueType(0);
1091 EVT EltVT = VT.getVectorElementType();
1092 if (!VT.isScalableVector() &&
1094 TargetLowering::Expand)
1095 break;
1096 // Otherwise canonicalize the whole vector.
1097 SDValue Mul = TLI.expandFCANONICALIZE(Node, DAG);
1098 Results.push_back(Mul);
1099 return;
1100 }
1101 case ISD::FSUB:
1102 ExpandFSUB(Node, Results);
1103 return;
1104 case ISD::SETCC:
1105 case ISD::VP_SETCC:
1106 ExpandSETCC(Node, Results);
1107 return;
1108 case ISD::ABS:
1110 if (SDValue Expanded = TLI.expandABS(Node, DAG)) {
1111 Results.push_back(Expanded);
1112 return;
1113 }
1114 break;
1115 case ISD::ABDS:
1116 case ISD::ABDU:
1117 if (SDValue Expanded = TLI.expandABD(Node, DAG)) {
1118 Results.push_back(Expanded);
1119 return;
1120 }
1121 break;
1122 case ISD::AVGCEILS:
1123 case ISD::AVGCEILU:
1124 case ISD::AVGFLOORS:
1125 case ISD::AVGFLOORU:
1126 if (SDValue Expanded = TLI.expandAVG(Node, DAG)) {
1127 Results.push_back(Expanded);
1128 return;
1129 }
1130 break;
1131 case ISD::BITREVERSE:
1132 if (SDValue Expanded = ExpandBITREVERSE(Node)) {
1133 Results.push_back(Expanded);
1134 return;
1135 }
1136 break;
1137 case ISD::VP_BITREVERSE:
1138 if (SDValue Expanded = TLI.expandVPBITREVERSE(Node, DAG)) {
1139 Results.push_back(Expanded);
1140 return;
1141 }
1142 break;
1143 case ISD::CTPOP:
1144 if (SDValue Expanded = TLI.expandCTPOP(Node, DAG)) {
1145 Results.push_back(Expanded);
1146 return;
1147 }
1148 break;
1149 case ISD::VP_CTPOP:
1150 if (SDValue Expanded = TLI.expandVPCTPOP(Node, DAG)) {
1151 Results.push_back(Expanded);
1152 return;
1153 }
1154 break;
1155 case ISD::CTLZ:
1157 if (SDValue Expanded = TLI.expandCTLZ(Node, DAG)) {
1158 Results.push_back(Expanded);
1159 return;
1160 }
1161 break;
1162 case ISD::VP_CTLZ:
1163 case ISD::VP_CTLZ_ZERO_POISON:
1164 if (SDValue Expanded = TLI.expandVPCTLZ(Node, DAG)) {
1165 Results.push_back(Expanded);
1166 return;
1167 }
1168 break;
1169 case ISD::CTTZ:
1171 if (SDValue Expanded = TLI.expandCTTZ(Node, DAG)) {
1172 Results.push_back(Expanded);
1173 return;
1174 }
1175 break;
1176 case ISD::VP_CTTZ:
1177 case ISD::VP_CTTZ_ZERO_POISON:
1178 if (SDValue Expanded = TLI.expandVPCTTZ(Node, DAG)) {
1179 Results.push_back(Expanded);
1180 return;
1181 }
1182 break;
1183 case ISD::FSHL:
1184 case ISD::VP_FSHL:
1185 case ISD::FSHR:
1186 case ISD::VP_FSHR:
1187 if (SDValue Expanded = TLI.expandFunnelShift(Node, DAG)) {
1188 Results.push_back(Expanded);
1189 return;
1190 }
1191 break;
1192 case ISD::CLMUL:
1193 case ISD::CLMULR:
1194 case ISD::CLMULH:
1195 if (SDValue Expanded = TLI.expandCLMUL(Node, DAG)) {
1196 Results.push_back(Expanded);
1197 return;
1198 }
1199 break;
1200 case ISD::ROTL:
1201 case ISD::ROTR:
1202 if (SDValue Expanded = TLI.expandROT(Node, false /*AllowVectorOps*/, DAG)) {
1203 Results.push_back(Expanded);
1204 return;
1205 }
1206 break;
1207 case ISD::FMINNUM:
1208 case ISD::FMAXNUM:
1209 if (SDValue Expanded = TLI.expandFMINNUM_FMAXNUM(Node, DAG)) {
1210 Results.push_back(Expanded);
1211 return;
1212 }
1213 break;
1214 case ISD::FMINIMUM:
1215 case ISD::FMAXIMUM:
1216 Results.push_back(TLI.expandFMINIMUM_FMAXIMUM(Node, DAG));
1217 return;
1218 case ISD::FMINIMUMNUM:
1219 case ISD::FMAXIMUMNUM:
1220 Results.push_back(TLI.expandFMINIMUMNUM_FMAXIMUMNUM(Node, DAG));
1221 return;
1222 case ISD::SMIN:
1223 case ISD::SMAX:
1224 case ISD::UMIN:
1225 case ISD::UMAX:
1226 if (SDValue Expanded = TLI.expandIntMINMAX(Node, DAG)) {
1227 Results.push_back(Expanded);
1228 return;
1229 }
1230 break;
1231 case ISD::UADDO:
1232 case ISD::USUBO:
1233 ExpandUADDSUBO(Node, Results);
1234 return;
1235 case ISD::SADDO:
1236 case ISD::SSUBO:
1237 ExpandSADDSUBO(Node, Results);
1238 return;
1239 case ISD::UMULO:
1240 case ISD::SMULO:
1241 ExpandMULO(Node, Results);
1242 return;
1243 case ISD::USUBSAT:
1244 case ISD::SSUBSAT:
1245 case ISD::UADDSAT:
1246 case ISD::SADDSAT:
1247 if (SDValue Expanded = TLI.expandAddSubSat(Node, DAG)) {
1248 Results.push_back(Expanded);
1249 return;
1250 }
1251 break;
1252 case ISD::USHLSAT:
1253 case ISD::SSHLSAT:
1254 if (SDValue Expanded = TLI.expandShlSat(Node, DAG)) {
1255 Results.push_back(Expanded);
1256 return;
1257 }
1258 break;
1261 // Expand the fpsosisat if it is scalable to prevent it from unrolling below.
1262 if (Node->getValueType(0).isScalableVector()) {
1263 if (SDValue Expanded = TLI.expandFP_TO_INT_SAT(Node, DAG)) {
1264 Results.push_back(Expanded);
1265 return;
1266 }
1267 }
1268 break;
1269 case ISD::SMULFIX:
1270 case ISD::UMULFIX:
1271 if (SDValue Expanded = TLI.expandFixedPointMul(Node, DAG)) {
1272 Results.push_back(Expanded);
1273 return;
1274 }
1275 break;
1276 case ISD::SMULFIXSAT:
1277 case ISD::UMULFIXSAT:
1278 // FIXME: We do not expand SMULFIXSAT/UMULFIXSAT here yet, not sure exactly
1279 // why. Maybe it results in worse codegen compared to the unroll for some
1280 // targets? This should probably be investigated. And if we still prefer to
1281 // unroll an explanation could be helpful.
1282 break;
1283 case ISD::SDIVFIX:
1284 case ISD::UDIVFIX:
1285 ExpandFixedPointDiv(Node, Results);
1286 return;
1287 case ISD::SDIVFIXSAT:
1288 case ISD::UDIVFIXSAT:
1289 break;
1290#define DAG_INSTRUCTION(NAME, NARG, ROUND_MODE, INTRINSIC, DAGN) \
1291 case ISD::STRICT_##DAGN:
1292#include "llvm/IR/ConstrainedOps.def"
1293 ExpandStrictFPOp(Node, Results);
1294 return;
1295 case ISD::VECREDUCE_ADD:
1296 case ISD::VECREDUCE_MUL:
1297 case ISD::VECREDUCE_AND:
1298 case ISD::VECREDUCE_OR:
1299 case ISD::VECREDUCE_XOR:
1310 Results.push_back(TLI.expandVecReduce(Node, DAG));
1311 return;
1316 Results.push_back(TLI.expandPartialReduceMLA(Node, DAG));
1317 return;
1320 Results.push_back(TLI.expandVecReduceSeq(Node, DAG));
1321 return;
1322 case ISD::SREM:
1323 case ISD::UREM:
1324 ExpandREM(Node, Results);
1325 return;
1326 case ISD::VP_MERGE:
1327 if (SDValue Expanded = ExpandVP_MERGE(Node)) {
1328 Results.push_back(Expanded);
1329 return;
1330 }
1331 break;
1332 case ISD::FREM: {
1333 RTLIB::Libcall LC = RTLIB::getREM(Node->getValueType(0));
1334 if (tryExpandVecMathCall(Node, LC, Results))
1335 return;
1336
1337 break;
1338 }
1339 case ISD::FSINCOS:
1340 case ISD::FSINCOSPI: {
1341 EVT VT = Node->getValueType(0);
1342 RTLIB::Libcall LC = Node->getOpcode() == ISD::FSINCOS
1343 ? RTLIB::getSINCOS(VT)
1344 : RTLIB::getSINCOSPI(VT);
1345 if (LC != RTLIB::UNKNOWN_LIBCALL &&
1346 TLI.expandMultipleResultFPLibCall(DAG, LC, Node, Results))
1347 return;
1348
1349 // TODO: Try to see if there's a narrower call available to use before
1350 // scalarizing.
1351 break;
1352 }
1353 case ISD::FPOW: {
1354 RTLIB::Libcall LC = RTLIB::getPOW(Node->getValueType(0));
1355 if (tryExpandVecMathCall(Node, LC, Results))
1356 return;
1357
1358 // TODO: Try to see if there's a narrower call available to use before
1359 // scalarizing.
1360 break;
1361 }
1362 case ISD::FCBRT: {
1363 RTLIB::Libcall LC = RTLIB::getCBRT(Node->getValueType(0));
1364 if (tryExpandVecMathCall(Node, LC, Results))
1365 return;
1366
1367 // TODO: Try to see if there's a narrower call available to use before
1368 // scalarizing.
1369 break;
1370 }
1371 case ISD::FMODF: {
1372 EVT VT = Node->getValueType(0);
1373 RTLIB::Libcall LC = RTLIB::getMODF(VT);
1374 if (LC != RTLIB::UNKNOWN_LIBCALL &&
1375 TLI.expandMultipleResultFPLibCall(DAG, LC, Node, Results,
1376 /*CallRetResNo=*/0))
1377 return;
1378 break;
1379 }
1381 Results.push_back(TLI.expandVECTOR_COMPRESS(Node, DAG));
1382 return;
1383 case ISD::CTTZ_ELTS:
1385 Results.push_back(TLI.expandCttzElts(Node, DAG));
1386 return;
1388 Results.push_back(TLI.expandVectorFindLastActive(Node, DAG));
1389 return;
1390 case ISD::SCMP:
1391 case ISD::UCMP:
1392 Results.push_back(TLI.expandCMP(Node, DAG));
1393 return;
1396 Results.push_back(ExpandLOOP_DEPENDENCE_MASK(Node));
1397 return;
1398
1399 case ISD::FADD:
1400 case ISD::FMUL:
1401 case ISD::FMA:
1402 case ISD::FDIV:
1403 case ISD::FCEIL:
1404 case ISD::FFLOOR:
1405 case ISD::FNEARBYINT:
1406 case ISD::FRINT:
1407 case ISD::FROUND:
1408 case ISD::FROUNDEVEN:
1409 case ISD::FTRUNC:
1410 case ISD::FSQRT:
1411 if (SDValue Expanded = TLI.expandVectorNaryOpBySplitting(Node, DAG)) {
1412 Results.push_back(Expanded);
1413 return;
1414 }
1415 break;
1417 if (SDValue Expanded = TLI.expandCONVERT_FROM_ARBITRARY_FP(Node, DAG))
1418 Results.push_back(Expanded);
1419 else
1420 Results.push_back(DAG.getPOISON(Node->getValueType(0)));
1421 return;
1422 case ISD::MASKED_UDIV:
1423 case ISD::MASKED_SDIV:
1424 case ISD::MASKED_UREM:
1425 case ISD::MASKED_SREM:
1426 Results.push_back(ExpandMaskedBinOp(Node));
1427 return;
1428 }
1429
1430 SDValue Unrolled = DAG.UnrollVectorOp(Node);
1431 if (Node->getNumValues() == 1) {
1432 Results.push_back(Unrolled);
1433 } else {
1434 assert(Node->getNumValues() == Unrolled->getNumValues() &&
1435 "VectorLegalizer Expand returned wrong number of results!");
1436 for (unsigned I = 0, E = Unrolled->getNumValues(); I != E; ++I)
1437 Results.push_back(Unrolled.getValue(I));
1438 }
1439}
1440
1441SDValue VectorLegalizer::ExpandSELECT(SDNode *Node) {
1442 // Lower a select instruction where the condition is a scalar and the
1443 // operands are vectors. Lower this select to VSELECT and implement it
1444 // using XOR AND OR. The selector bit is broadcasted.
1445 EVT VT = Node->getValueType(0);
1446 SDLoc DL(Node);
1447
1448 SDValue Mask = Node->getOperand(0);
1449 SDValue Op1 = Node->getOperand(1);
1450 SDValue Op2 = Node->getOperand(2);
1451
1452 assert(VT.isVector() && !Mask.getValueType().isVector()
1453 && Op1.getValueType() == Op2.getValueType() && "Invalid type");
1454
1455 // If we can't even use the basic vector operations of
1456 // AND,OR,XOR, we will have to scalarize the op.
1457 // Notice that the operation may be 'promoted' which means that it is
1458 // 'bitcasted' to another type which is handled.
1459 // Also, we need to be able to construct a splat vector using either
1460 // BUILD_VECTOR or SPLAT_VECTOR.
1461 // FIXME: Should we also permit fixed-length SPLAT_VECTOR as a fallback to
1462 // BUILD_VECTOR?
1463 if (TLI.getOperationAction(ISD::AND, VT) == TargetLowering::Expand ||
1464 TLI.getOperationAction(ISD::XOR, VT) == TargetLowering::Expand ||
1465 TLI.getOperationAction(ISD::OR, VT) == TargetLowering::Expand ||
1468 VT) == TargetLowering::Expand)
1469 return SDValue();
1470
1471 // Generate a mask operand.
1472 EVT MaskTy = VT.changeVectorElementTypeToInteger();
1473
1474 // What is the size of each element in the vector mask.
1475 EVT BitTy = MaskTy.getScalarType();
1476
1477 Mask = DAG.getSelect(DL, BitTy, Mask, DAG.getAllOnesConstant(DL, BitTy),
1478 DAG.getConstant(0, DL, BitTy));
1479
1480 // Broadcast the mask so that the entire vector is all one or all zero.
1481 Mask = DAG.getSplat(MaskTy, DL, Mask);
1482
1483 // Bitcast the operands to be the same type as the mask.
1484 // This is needed when we select between FP types because
1485 // the mask is a vector of integers.
1486 Op1 = DAG.getNode(ISD::BITCAST, DL, MaskTy, Op1);
1487 Op2 = DAG.getNode(ISD::BITCAST, DL, MaskTy, Op2);
1488
1489 SDValue NotMask = DAG.getNOT(DL, Mask, MaskTy);
1490
1491 Op1 = DAG.getNode(ISD::AND, DL, MaskTy, Op1, Mask);
1492 Op2 = DAG.getNode(ISD::AND, DL, MaskTy, Op2, NotMask);
1493 SDValue Val = DAG.getNode(ISD::OR, DL, MaskTy, Op1, Op2);
1494 return DAG.getNode(ISD::BITCAST, DL, Node->getValueType(0), Val);
1495}
1496
1497SDValue VectorLegalizer::ExpandSEXTINREG(SDNode *Node) {
1498 EVT VT = Node->getValueType(0);
1499
1500 // Make sure that the SRA and SHL instructions are available.
1501 if (TLI.getOperationAction(ISD::SRA, VT) == TargetLowering::Expand ||
1502 TLI.getOperationAction(ISD::SHL, VT) == TargetLowering::Expand)
1503 return SDValue();
1504
1505 SDLoc DL(Node);
1506 EVT OrigTy = cast<VTSDNode>(Node->getOperand(1))->getVT();
1507
1508 unsigned BW = VT.getScalarSizeInBits();
1509 unsigned OrigBW = OrigTy.getScalarSizeInBits();
1510 SDValue ShiftSz = DAG.getConstant(BW - OrigBW, DL, VT);
1511
1512 SDValue Op = DAG.getNode(ISD::SHL, DL, VT, Node->getOperand(0), ShiftSz);
1513 return DAG.getNode(ISD::SRA, DL, VT, Op, ShiftSz);
1514}
1515
1516// Generically expand a vector anyext in register to a shuffle of the relevant
1517// lanes into the appropriate locations, with other lanes left undef.
1518SDValue VectorLegalizer::ExpandANY_EXTEND_VECTOR_INREG(SDNode *Node) {
1519 SDLoc DL(Node);
1520 EVT VT = Node->getValueType(0);
1521 int NumElements = VT.getVectorNumElements();
1522 SDValue Src = Node->getOperand(0);
1523 EVT SrcVT = Src.getValueType();
1524 int NumSrcElements = SrcVT.getVectorNumElements();
1525
1526 // *_EXTEND_VECTOR_INREG SrcVT can be smaller than VT - so insert the vector
1527 // into a larger vector type.
1528 if (SrcVT.bitsLE(VT)) {
1529 assert((VT.getSizeInBits() % SrcVT.getScalarSizeInBits()) == 0 &&
1530 "ANY_EXTEND_VECTOR_INREG vector size mismatch");
1531 NumSrcElements = VT.getSizeInBits() / SrcVT.getScalarSizeInBits();
1532 SrcVT = EVT::getVectorVT(*DAG.getContext(), SrcVT.getScalarType(),
1533 NumSrcElements);
1534 Src = DAG.getInsertSubvector(DL, DAG.getUNDEF(SrcVT), Src, 0);
1535 }
1536
1537 // Build a base mask of undef shuffles.
1538 SmallVector<int, 16> ShuffleMask;
1539 ShuffleMask.resize(NumSrcElements, -1);
1540
1541 // Place the extended lanes into the correct locations.
1542 int ExtLaneScale = NumSrcElements / NumElements;
1543 int EndianOffset = DAG.getDataLayout().isBigEndian() ? ExtLaneScale - 1 : 0;
1544 for (int i = 0; i < NumElements; ++i)
1545 ShuffleMask[i * ExtLaneScale + EndianOffset] = i;
1546
1547 return DAG.getNode(
1548 ISD::BITCAST, DL, VT,
1549 DAG.getVectorShuffle(SrcVT, DL, Src, DAG.getPOISON(SrcVT), ShuffleMask));
1550}
1551
1552SDValue VectorLegalizer::ExpandSIGN_EXTEND_VECTOR_INREG(SDNode *Node) {
1553 SDLoc DL(Node);
1554 EVT VT = Node->getValueType(0);
1555 SDValue Src = Node->getOperand(0);
1556 EVT SrcVT = Src.getValueType();
1557
1558 // First build an any-extend node which can be legalized above when we
1559 // recurse through it.
1561
1562 // Now we need sign extend. Do this by shifting the elements. Even if these
1563 // aren't legal operations, they have a better chance of being legalized
1564 // without full scalarization than the sign extension does.
1565 unsigned EltWidth = VT.getScalarSizeInBits();
1566 unsigned SrcEltWidth = SrcVT.getScalarSizeInBits();
1567 SDValue ShiftAmount = DAG.getConstant(EltWidth - SrcEltWidth, DL, VT);
1568 return DAG.getNode(ISD::SRA, DL, VT,
1569 DAG.getNode(ISD::SHL, DL, VT, Op, ShiftAmount),
1570 ShiftAmount);
1571}
1572
1573// Generically expand a vector zext in register to a shuffle of the relevant
1574// lanes into the appropriate locations, a blend of zero into the high bits,
1575// and a bitcast to the wider element type.
1576SDValue VectorLegalizer::ExpandZERO_EXTEND_VECTOR_INREG(SDNode *Node) {
1577 SDLoc DL(Node);
1578 EVT VT = Node->getValueType(0);
1579 int NumElements = VT.getVectorNumElements();
1580 SDValue Src = Node->getOperand(0);
1581 EVT SrcVT = Src.getValueType();
1582 int NumSrcElements = SrcVT.getVectorNumElements();
1583
1584 // *_EXTEND_VECTOR_INREG SrcVT can be smaller than VT - so insert the vector
1585 // into a larger vector type.
1586 if (SrcVT.bitsLE(VT)) {
1587 assert((VT.getSizeInBits() % SrcVT.getScalarSizeInBits()) == 0 &&
1588 "ZERO_EXTEND_VECTOR_INREG vector size mismatch");
1589 NumSrcElements = VT.getSizeInBits() / SrcVT.getScalarSizeInBits();
1590 SrcVT = EVT::getVectorVT(*DAG.getContext(), SrcVT.getScalarType(),
1591 NumSrcElements);
1592 Src = DAG.getInsertSubvector(DL, DAG.getUNDEF(SrcVT), Src, 0);
1593 }
1594
1595 // Build up a zero vector to blend into this one.
1596 SDValue Zero = DAG.getConstant(0, DL, SrcVT);
1597
1598 // Shuffle the incoming lanes into the correct position, and pull all other
1599 // lanes from the zero vector.
1600 auto ShuffleMask = llvm::to_vector<16>(llvm::seq<int>(0, NumSrcElements));
1601
1602 int ExtLaneScale = NumSrcElements / NumElements;
1603 int EndianOffset = DAG.getDataLayout().isBigEndian() ? ExtLaneScale - 1 : 0;
1604 for (int i = 0; i < NumElements; ++i)
1605 ShuffleMask[i * ExtLaneScale + EndianOffset] = NumSrcElements + i;
1606
1607 return DAG.getNode(ISD::BITCAST, DL, VT,
1608 DAG.getVectorShuffle(SrcVT, DL, Zero, Src, ShuffleMask));
1609}
1610
1611static void createBSWAPShuffleMask(EVT VT, SmallVectorImpl<int> &ShuffleMask) {
1612 int ScalarSizeInBytes = VT.getScalarSizeInBits() / 8;
1613 for (int I = 0, E = VT.getVectorNumElements(); I != E; ++I)
1614 for (int J = ScalarSizeInBytes - 1; J >= 0; --J)
1615 ShuffleMask.push_back((I * ScalarSizeInBytes) + J);
1616}
1617
1618SDValue VectorLegalizer::ExpandBSWAP(SDNode *Node) {
1619 EVT VT = Node->getValueType(0);
1620
1621 // Scalable vectors can't use shuffle expansion.
1622 if (VT.isScalableVector())
1623 return TLI.expandBSWAP(Node, DAG);
1624
1625 // Generate a byte wise shuffle mask for the BSWAP.
1626 SmallVector<int, 16> ShuffleMask;
1627 createBSWAPShuffleMask(VT, ShuffleMask);
1628 EVT ByteVT = EVT::getVectorVT(*DAG.getContext(), MVT::i8, ShuffleMask.size());
1629
1630 // Only emit a shuffle if the mask is legal.
1631 if (TLI.isShuffleMaskLegal(ShuffleMask, ByteVT)) {
1632 SDLoc DL(Node);
1633 SDValue Op = DAG.getNode(ISD::BITCAST, DL, ByteVT, Node->getOperand(0));
1634 Op = DAG.getVectorShuffle(ByteVT, DL, Op, DAG.getPOISON(ByteVT),
1635 ShuffleMask);
1636 return DAG.getNode(ISD::BITCAST, DL, VT, Op);
1637 }
1638
1639 // If we have the appropriate vector bit operations, it is better to use them
1640 // than unrolling and expanding each component.
1641 if (TLI.isOperationLegalOrCustom(ISD::SHL, VT) &&
1645 return TLI.expandBSWAP(Node, DAG);
1646
1647 // Otherwise let the caller unroll.
1648 return SDValue();
1649}
1650
1651SDValue VectorLegalizer::ExpandBITREVERSE(SDNode *Node) {
1652 EVT VT = Node->getValueType(0);
1653
1654 // We can't unroll or use shuffles for scalable vectors.
1655 if (VT.isScalableVector())
1656 return TLI.expandBITREVERSE(Node, DAG);
1657
1658 // If we have the scalar operation, it's probably cheaper to unroll it.
1660 return SDValue();
1661
1662 // If the vector element width is a whole number of bytes, test if its legal
1663 // to BSWAP shuffle the bytes and then perform the BITREVERSE on the byte
1664 // vector. This greatly reduces the number of bit shifts necessary.
1665 unsigned ScalarSizeInBits = VT.getScalarSizeInBits();
1666 if (ScalarSizeInBits > 8 && (ScalarSizeInBits % 8) == 0) {
1667 SmallVector<int, 16> BSWAPMask;
1668 createBSWAPShuffleMask(VT, BSWAPMask);
1669
1670 EVT ByteVT = EVT::getVectorVT(*DAG.getContext(), MVT::i8, BSWAPMask.size());
1671 if (TLI.isShuffleMaskLegal(BSWAPMask, ByteVT) &&
1673 (TLI.isOperationLegalOrCustom(ISD::SHL, ByteVT) &&
1674 TLI.isOperationLegalOrCustom(ISD::SRL, ByteVT) &&
1677 SDLoc DL(Node);
1678 SDValue Op = DAG.getNode(ISD::BITCAST, DL, ByteVT, Node->getOperand(0));
1679 Op = DAG.getVectorShuffle(ByteVT, DL, Op, DAG.getPOISON(ByteVT),
1680 BSWAPMask);
1681 Op = DAG.getNode(ISD::BITREVERSE, DL, ByteVT, Op);
1682 Op = DAG.getNode(ISD::BITCAST, DL, VT, Op);
1683 return Op;
1684 }
1685 }
1686
1687 // If we have the appropriate vector bit operations, it is better to use them
1688 // than unrolling and expanding each component.
1689 if (TLI.isOperationLegalOrCustom(ISD::SHL, VT) &&
1693 return TLI.expandBITREVERSE(Node, DAG);
1694
1695 // Otherwise unroll.
1696 return SDValue();
1697}
1698
1699SDValue VectorLegalizer::ExpandVSELECT(SDNode *Node) {
1700 // Implement VSELECT in terms of XOR, AND, OR
1701 // on platforms which do not support blend natively.
1702 SDLoc DL(Node);
1703
1704 SDValue Mask = Node->getOperand(0);
1705 SDValue Op1 = Node->getOperand(1);
1706 SDValue Op2 = Node->getOperand(2);
1707
1708 EVT VT = Mask.getValueType();
1709
1710 // If we can't even use the basic vector operations of
1711 // AND,OR,XOR, we will have to scalarize the op.
1712 // Notice that the operation may be 'promoted' which means that it is
1713 // 'bitcasted' to another type which is handled.
1714 if (TLI.getOperationAction(ISD::AND, VT) == TargetLowering::Expand ||
1715 TLI.getOperationAction(ISD::XOR, VT) == TargetLowering::Expand ||
1716 TLI.getOperationAction(ISD::OR, VT) == TargetLowering::Expand)
1717 return SDValue();
1718
1719 // This operation also isn't safe with AND, OR, XOR when the boolean type is
1720 // 0/1 and the select operands aren't also booleans, as we need an all-ones
1721 // vector constant to mask with.
1722 // FIXME: Sign extend 1 to all ones if that's legal on the target.
1723 auto BoolContents = TLI.getBooleanContents(Op1.getValueType());
1724 if (BoolContents != TargetLowering::ZeroOrNegativeOneBooleanContent &&
1725 !(BoolContents == TargetLowering::ZeroOrOneBooleanContent &&
1726 Op1.getValueType().getVectorElementType() == MVT::i1))
1727 return SDValue();
1728
1729 // If the mask and the type are different sizes, unroll the vector op. This
1730 // can occur when getSetCCResultType returns something that is different in
1731 // size from the operand types. For example, v4i8 = select v4i32, v4i8, v4i8.
1732 if (VT.getSizeInBits() != Op1.getValueSizeInBits())
1733 return SDValue();
1734
1735 // Bitcast the operands to be the same type as the mask.
1736 // This is needed when we select between FP types because
1737 // the mask is a vector of integers.
1738 Op1 = DAG.getNode(ISD::BITCAST, DL, VT, Op1);
1739 Op2 = DAG.getNode(ISD::BITCAST, DL, VT, Op2);
1740
1741 SDValue NotMask = DAG.getNOT(DL, Mask, VT);
1742
1743 Op1 = DAG.getNode(ISD::AND, DL, VT, Op1, Mask);
1744 Op2 = DAG.getNode(ISD::AND, DL, VT, Op2, NotMask);
1745 SDValue Val = DAG.getNode(ISD::OR, DL, VT, Op1, Op2);
1746 return DAG.getNode(ISD::BITCAST, DL, Node->getValueType(0), Val);
1747}
1748
1749SDValue VectorLegalizer::ExpandVP_SELECT(SDNode *Node) {
1750 // Implement VP_SELECT in terms of VP_XOR, VP_AND and VP_OR on platforms which
1751 // do not support it natively.
1752 SDLoc DL(Node);
1753
1754 SDValue Mask = Node->getOperand(0);
1755 SDValue Op1 = Node->getOperand(1);
1756 SDValue Op2 = Node->getOperand(2);
1757 SDValue EVL = Node->getOperand(3);
1758
1759 EVT VT = Mask.getValueType();
1760
1761 // If we can't even use the basic vector operations of
1762 // VP_AND,VP_OR,VP_XOR, we will have to scalarize the op.
1763 if (TLI.getOperationAction(ISD::VP_AND, VT) == TargetLowering::Expand ||
1764 TLI.getOperationAction(ISD::VP_XOR, VT) == TargetLowering::Expand ||
1765 TLI.getOperationAction(ISD::VP_OR, VT) == TargetLowering::Expand)
1766 return SDValue();
1767
1768 // This operation also isn't safe when the operands aren't also booleans.
1769 if (Op1.getValueType().getVectorElementType() != MVT::i1)
1770 return SDValue();
1771
1772 SDValue Ones = DAG.getAllOnesConstant(DL, VT);
1773 SDValue NotMask = DAG.getNode(ISD::VP_XOR, DL, VT, Mask, Ones, Ones, EVL);
1774
1775 Op1 = DAG.getNode(ISD::VP_AND, DL, VT, Op1, Mask, Ones, EVL);
1776 Op2 = DAG.getNode(ISD::VP_AND, DL, VT, Op2, NotMask, Ones, EVL);
1777 return DAG.getNode(ISD::VP_OR, DL, VT, Op1, Op2, Ones, EVL);
1778}
1779
1780SDValue VectorLegalizer::ExpandVP_MERGE(SDNode *Node) {
1781 // Implement VP_MERGE in terms of VSELECT. Construct a mask where vector
1782 // indices less than the EVL/pivot are true. Combine that with the original
1783 // mask for a full-length mask. Use a full-length VSELECT to select between
1784 // the true and false values.
1785 SDLoc DL(Node);
1786
1787 SDValue Mask = Node->getOperand(0);
1788 SDValue Op1 = Node->getOperand(1);
1789 SDValue Op2 = Node->getOperand(2);
1790 SDValue EVL = Node->getOperand(3);
1791
1792 EVT MaskVT = Mask.getValueType();
1793 bool IsFixedLen = MaskVT.isFixedLengthVector();
1794
1795 EVT EVLVecVT = EVT::getVectorVT(*DAG.getContext(), EVL.getValueType(),
1796 MaskVT.getVectorElementCount());
1797
1798 // If we can't construct the EVL mask efficiently, it's better to unroll.
1799 if ((IsFixedLen &&
1801 (!IsFixedLen &&
1802 (!TLI.isOperationLegalOrCustom(ISD::STEP_VECTOR, EVLVecVT) ||
1804 return SDValue();
1805
1806 // If using a SETCC would result in a different type than the mask type,
1807 // unroll.
1808 if (TLI.getSetCCResultType(DAG.getDataLayout(), *DAG.getContext(),
1809 EVLVecVT) != MaskVT)
1810 return SDValue();
1811
1812 SDValue StepVec = DAG.getStepVector(DL, EVLVecVT);
1813 SDValue SplatEVL = DAG.getSplat(EVLVecVT, DL, EVL);
1814 SDValue EVLMask =
1815 DAG.getSetCC(DL, MaskVT, StepVec, SplatEVL, ISD::CondCode::SETULT);
1816
1817 SDValue FullMask = DAG.getNode(ISD::AND, DL, MaskVT, Mask, EVLMask);
1818 return DAG.getSelect(DL, Node->getValueType(0), FullMask, Op1, Op2);
1819}
1820
1821SDValue VectorLegalizer::ExpandVP_REM(SDNode *Node) {
1822 // Implement VP_SREM/UREM in terms of VP_SDIV/VP_UDIV, VP_MUL, VP_SUB.
1823 EVT VT = Node->getValueType(0);
1824
1825 unsigned DivOpc = Node->getOpcode() == ISD::VP_SREM ? ISD::VP_SDIV : ISD::VP_UDIV;
1826
1827 if (!TLI.isOperationLegalOrCustom(DivOpc, VT) ||
1828 !TLI.isOperationLegalOrCustom(ISD::VP_MUL, VT) ||
1829 !TLI.isOperationLegalOrCustom(ISD::VP_SUB, VT))
1830 return SDValue();
1831
1832 SDLoc DL(Node);
1833
1834 SDValue Dividend = Node->getOperand(0);
1835 SDValue Divisor = Node->getOperand(1);
1836 SDValue Mask = Node->getOperand(2);
1837 SDValue EVL = Node->getOperand(3);
1838
1839 // X % Y -> X-X/Y*Y
1840 SDValue Div = DAG.getNode(DivOpc, DL, VT, Dividend, Divisor, Mask, EVL);
1841 SDValue Mul = DAG.getNode(ISD::VP_MUL, DL, VT, Divisor, Div, Mask, EVL);
1842 return DAG.getNode(ISD::VP_SUB, DL, VT, Dividend, Mul, Mask, EVL);
1843}
1844
1845SDValue VectorLegalizer::ExpandVP_FNEG(SDNode *Node) {
1846 EVT VT = Node->getValueType(0);
1847 EVT IntVT = VT.changeVectorElementTypeToInteger();
1848
1849 if (!TLI.isOperationLegalOrCustom(ISD::VP_XOR, IntVT))
1850 return SDValue();
1851
1852 SDValue Mask = Node->getOperand(1);
1853 SDValue EVL = Node->getOperand(2);
1854
1855 SDLoc DL(Node);
1856 SDValue Cast = DAG.getNode(ISD::BITCAST, DL, IntVT, Node->getOperand(0));
1857 SDValue SignMask = DAG.getConstant(
1858 APInt::getSignMask(IntVT.getScalarSizeInBits()), DL, IntVT);
1859 SDValue Xor = DAG.getNode(ISD::VP_XOR, DL, IntVT, Cast, SignMask, Mask, EVL);
1860 return DAG.getNode(ISD::BITCAST, DL, VT, Xor);
1861}
1862
1863SDValue VectorLegalizer::ExpandVP_FABS(SDNode *Node) {
1864 EVT VT = Node->getValueType(0);
1865 EVT IntVT = VT.changeVectorElementTypeToInteger();
1866
1867 if (!TLI.isOperationLegalOrCustom(ISD::VP_AND, IntVT))
1868 return SDValue();
1869
1870 SDValue Mask = Node->getOperand(1);
1871 SDValue EVL = Node->getOperand(2);
1872
1873 SDLoc DL(Node);
1874 SDValue Cast = DAG.getNode(ISD::BITCAST, DL, IntVT, Node->getOperand(0));
1875 SDValue ClearSignMask = DAG.getConstant(
1877 SDValue ClearSign =
1878 DAG.getNode(ISD::VP_AND, DL, IntVT, Cast, ClearSignMask, Mask, EVL);
1879 return DAG.getNode(ISD::BITCAST, DL, VT, ClearSign);
1880}
1881
1882SDValue VectorLegalizer::ExpandVP_FCOPYSIGN(SDNode *Node) {
1883 EVT VT = Node->getValueType(0);
1884
1885 if (VT != Node->getOperand(1).getValueType())
1886 return SDValue();
1887
1888 EVT IntVT = VT.changeVectorElementTypeToInteger();
1889 if (!TLI.isOperationLegalOrCustom(ISD::VP_AND, IntVT) ||
1890 !TLI.isOperationLegalOrCustom(ISD::VP_XOR, IntVT))
1891 return SDValue();
1892
1893 SDValue Mask = Node->getOperand(2);
1894 SDValue EVL = Node->getOperand(3);
1895
1896 SDLoc DL(Node);
1897 SDValue Mag = DAG.getNode(ISD::BITCAST, DL, IntVT, Node->getOperand(0));
1898 SDValue Sign = DAG.getNode(ISD::BITCAST, DL, IntVT, Node->getOperand(1));
1899
1900 SDValue SignMask = DAG.getConstant(
1901 APInt::getSignMask(IntVT.getScalarSizeInBits()), DL, IntVT);
1902 SDValue SignBit =
1903 DAG.getNode(ISD::VP_AND, DL, IntVT, Sign, SignMask, Mask, EVL);
1904
1905 SDValue ClearSignMask = DAG.getConstant(
1907 SDValue ClearedSign =
1908 DAG.getNode(ISD::VP_AND, DL, IntVT, Mag, ClearSignMask, Mask, EVL);
1909
1910 SDValue CopiedSign = DAG.getNode(ISD::VP_OR, DL, IntVT, ClearedSign, SignBit,
1911 Mask, EVL, SDNodeFlags::Disjoint);
1912
1913 return DAG.getNode(ISD::BITCAST, DL, VT, CopiedSign);
1914}
1915
1916SDValue VectorLegalizer::ExpandLOOP_DEPENDENCE_MASK(SDNode *N) {
1917 return TLI.expandLoopDependenceMask(N, DAG);
1918}
1919
1920SDValue VectorLegalizer::ExpandMaskedBinOp(SDNode *N) {
1921 // Masked bin ops don't have undefined behaviour when dividing by zero
1922 // on disabled lanes and produce poison instead. Replace the divisor on the
1923 // disabled lanes with 1 to avoid division by zero or overflow.
1924 SDLoc dl(N);
1925 EVT VT = N->getValueType(0);
1926 SDValue SafeDivisor = DAG.getSelect(
1927 dl, VT, N->getOperand(2), N->getOperand(1), DAG.getConstant(1, dl, VT));
1928 return DAG.getNode(ISD::getUnmaskedBinOpOpcode(N->getOpcode()), dl, VT,
1929 N->getOperand(0), SafeDivisor);
1930}
1931
1932void VectorLegalizer::ExpandFP_TO_UINT(SDNode *Node,
1933 SmallVectorImpl<SDValue> &Results) {
1934 // Attempt to expand using TargetLowering.
1935 SDValue Result, Chain;
1936 if (TLI.expandFP_TO_UINT(Node, Result, Chain, DAG)) {
1937 Results.push_back(Result);
1938 if (Node->isStrictFPOpcode())
1939 Results.push_back(Chain);
1940 return;
1941 }
1942
1943 // Otherwise go ahead and unroll.
1944 if (Node->isStrictFPOpcode()) {
1945 UnrollStrictFPOp(Node, Results);
1946 return;
1947 }
1948
1949 Results.push_back(DAG.UnrollVectorOp(Node));
1950}
1951
1952void VectorLegalizer::ExpandUINT_TO_FLOAT(SDNode *Node,
1953 SmallVectorImpl<SDValue> &Results) {
1954 bool IsStrict = Node->isStrictFPOpcode();
1955 unsigned OpNo = IsStrict ? 1 : 0;
1956 SDValue Src = Node->getOperand(OpNo);
1957 EVT SrcVT = Src.getValueType();
1958 EVT DstVT = Node->getValueType(0);
1959 SDLoc DL(Node);
1960
1961 // Attempt to expand using TargetLowering.
1963 SDValue Chain;
1964 if (TLI.expandUINT_TO_FP(Node, Result, Chain, DAG)) {
1965 Results.push_back(Result);
1966 if (IsStrict)
1967 Results.push_back(Chain);
1968 return;
1969 }
1970
1971 // Make sure that the SINT_TO_FP and SRL instructions are available.
1972 if (((!IsStrict && TLI.getOperationAction(ISD::SINT_TO_FP, SrcVT) ==
1973 TargetLowering::Expand) ||
1974 (IsStrict && TLI.getOperationAction(ISD::STRICT_SINT_TO_FP, SrcVT) ==
1975 TargetLowering::Expand)) ||
1976 TLI.getOperationAction(ISD::SRL, SrcVT) == TargetLowering::Expand) {
1977 if (IsStrict) {
1978 UnrollStrictFPOp(Node, Results);
1979 return;
1980 }
1981
1982 Results.push_back(DAG.UnrollVectorOp(Node));
1983 return;
1984 }
1985
1986 unsigned BW = SrcVT.getScalarSizeInBits();
1987 assert((BW == 64 || BW == 32) &&
1988 "Elements in vector-UINT_TO_FP must be 32 or 64 bits wide");
1989
1990 // If STRICT_/FMUL is not supported by the target (in case of f16) replace the
1991 // UINT_TO_FP with a larger float and round to the smaller type
1992 if ((!IsStrict && !TLI.isOperationLegalOrCustom(ISD::FMUL, DstVT)) ||
1993 (IsStrict && !TLI.isOperationLegalOrCustom(ISD::STRICT_FMUL, DstVT))) {
1994 EVT FPVT = BW == 32 ? MVT::f32 : MVT::f64;
1995 SDValue UIToFP;
1997 SDValue TargetZero = DAG.getIntPtrConstant(0, DL, /*isTarget=*/true);
1998 EVT FloatVecVT = SrcVT.changeVectorElementType(*DAG.getContext(), FPVT);
1999 if (IsStrict) {
2000 UIToFP = DAG.getNode(ISD::STRICT_UINT_TO_FP, DL, {FloatVecVT, MVT::Other},
2001 {Node->getOperand(0), Src});
2002 Result = DAG.getNode(ISD::STRICT_FP_ROUND, DL, {DstVT, MVT::Other},
2003 {Node->getOperand(0), UIToFP, TargetZero});
2004 Results.push_back(Result);
2005 Results.push_back(Result.getValue(1));
2006 } else {
2007 UIToFP = DAG.getNode(ISD::UINT_TO_FP, DL, FloatVecVT, Src);
2008 Result = DAG.getNode(ISD::FP_ROUND, DL, DstVT, UIToFP, TargetZero);
2009 Results.push_back(Result);
2010 }
2011
2012 return;
2013 }
2014
2015 SDValue HalfWord = DAG.getConstant(BW / 2, DL, SrcVT);
2016
2017 // Constants to clear the upper part of the word.
2018 // Notice that we can also use SHL+SHR, but using a constant is slightly
2019 // faster on x86.
2020 uint64_t HWMask = (BW == 64) ? 0x00000000FFFFFFFF : 0x0000FFFF;
2021 SDValue HalfWordMask = DAG.getConstant(HWMask, DL, SrcVT);
2022
2023 // Two to the power of half-word-size.
2024 SDValue TWOHW = DAG.getConstantFP(1ULL << (BW / 2), DL, DstVT);
2025
2026 // Clear upper part of LO, lower HI
2027 SDValue HI = DAG.getNode(ISD::SRL, DL, SrcVT, Src, HalfWord);
2028 SDValue LO = DAG.getNode(ISD::AND, DL, SrcVT, Src, HalfWordMask);
2029
2030 if (IsStrict) {
2031 // Convert hi and lo to floats
2032 // Convert the hi part back to the upper values
2033 // TODO: Can any fast-math-flags be set on these nodes?
2034 SDValue fHI = DAG.getNode(ISD::STRICT_SINT_TO_FP, DL, {DstVT, MVT::Other},
2035 {Node->getOperand(0), HI});
2036 fHI = DAG.getNode(ISD::STRICT_FMUL, DL, {DstVT, MVT::Other},
2037 {fHI.getValue(1), fHI, TWOHW});
2038 SDValue fLO = DAG.getNode(ISD::STRICT_SINT_TO_FP, DL, {DstVT, MVT::Other},
2039 {Node->getOperand(0), LO});
2040
2041 SDValue TF = DAG.getNode(ISD::TokenFactor, DL, MVT::Other, fHI.getValue(1),
2042 fLO.getValue(1));
2043
2044 // Add the two halves
2045 SDValue Result =
2046 DAG.getNode(ISD::STRICT_FADD, DL, {DstVT, MVT::Other}, {TF, fHI, fLO});
2047
2048 Results.push_back(Result);
2049 Results.push_back(Result.getValue(1));
2050 return;
2051 }
2052
2053 // Convert hi and lo to floats
2054 // Convert the hi part back to the upper values
2055 // TODO: Can any fast-math-flags be set on these nodes?
2056 SDValue fHI = DAG.getNode(ISD::SINT_TO_FP, DL, DstVT, HI);
2057 fHI = DAG.getNode(ISD::FMUL, DL, DstVT, fHI, TWOHW);
2058 SDValue fLO = DAG.getNode(ISD::SINT_TO_FP, DL, DstVT, LO);
2059
2060 // Add the two halves
2061 Results.push_back(DAG.getNode(ISD::FADD, DL, DstVT, fHI, fLO));
2062}
2063
2064SDValue VectorLegalizer::ExpandFNEG(SDNode *Node) {
2065 EVT VT = Node->getValueType(0);
2066 EVT IntVT = VT.changeVectorElementTypeToInteger();
2067
2068 if (!TLI.isOperationLegalOrCustom(ISD::XOR, IntVT))
2069 return SDValue();
2070
2071 // Heuristic check to determine whether vector should be expanded to integer
2072 // operations or unrolled to scalar operations.
2073 // 1. Scalable vector is never unrolled.
2074 // 2. Fixed vector is unrolled if one of followings is true:
2075 // a. Vector only has 1 element and target knows how to handle scalar
2076 // FNEG (either legal or custom expand or promote).
2077 // b. Vector has more than 1 element and target supports scalar
2078 // FNEG natively and vector length <= 2(1 XOR + 1 CONST).
2079 // FIXME: Scalar construction instruction count varies in every architecture,
2080 // here we assume 1 instruction for now.
2081 if (VT.isFixedLengthVector()) {
2082 EVT EltVT = VT.getVectorElementType();
2083 unsigned NumElts = VT.getVectorNumElements();
2084 if ((NumElts == 1 &&
2086 (NumElts < 3 && TLI.isOperationLegal(ISD::FNEG, EltVT) &&
2087 TLI.isExtractVecEltCheap(VT, 0) &&
2088 (NumElts == 1 || TLI.isExtractVecEltCheap(VT, 1))))
2089 return SDValue();
2090 }
2091
2092 SDLoc DL(Node);
2093 SDValue Cast = DAG.getNode(ISD::BITCAST, DL, IntVT, Node->getOperand(0));
2094 SDValue SignMask = DAG.getConstant(
2095 APInt::getSignMask(IntVT.getScalarSizeInBits()), DL, IntVT);
2096 SDValue Xor = DAG.getNode(ISD::XOR, DL, IntVT, Cast, SignMask);
2097 return DAG.getNode(ISD::BITCAST, DL, VT, Xor);
2098}
2099
2100SDValue VectorLegalizer::ExpandFABS(SDNode *Node) {
2101 EVT VT = Node->getValueType(0);
2102 EVT IntVT = VT.changeVectorElementTypeToInteger();
2103
2104 if (!TLI.isOperationLegalOrCustom(ISD::AND, IntVT))
2105 return SDValue();
2106
2107 // Heuristic check to determine whether vector should be expanded to integer
2108 // operations or unrolled to scalar operations.
2109 // 1. Scalable vector is never unrolled.
2110 // 2. Fixed vector is unrolled if one of followings is true:
2111 // a. Vector only has 1 element and target knows how to handle scalar
2112 // FABS(either legal or custom expand or promote).
2113 // b. Vector has more than 1 element and target supports scalar
2114 // FABS natively and vector length <= 2(1 AND + 1 CONST).
2115 // FIXME: Scalar construction instruction count varies in every architecture,
2116 // here we assume 1 instruction for now.
2117 if (VT.isFixedLengthVector()) {
2118 EVT EltVT = VT.getVectorElementType();
2119 unsigned NumElts = VT.getVectorNumElements();
2120 if ((NumElts == 1 &&
2122 (NumElts < 3 && TLI.isOperationLegal(ISD::FABS, EltVT) &&
2123 TLI.isExtractVecEltCheap(VT, 0) &&
2124 (NumElts == 1 || TLI.isExtractVecEltCheap(VT, 1))))
2125 return SDValue();
2126 }
2127
2128 SDLoc DL(Node);
2129 SDValue Cast = DAG.getNode(ISD::BITCAST, DL, IntVT, Node->getOperand(0));
2130 SDValue ClearSignMask = DAG.getConstant(
2132 SDValue ClearedSign = DAG.getNode(ISD::AND, DL, IntVT, Cast, ClearSignMask);
2133 return DAG.getNode(ISD::BITCAST, DL, VT, ClearedSign);
2134}
2135
2136SDValue VectorLegalizer::ExpandFCOPYSIGN(SDNode *Node) {
2137 EVT VT = Node->getValueType(0);
2138 EVT IntVT = VT.changeVectorElementTypeToInteger();
2139
2140 if (VT != Node->getOperand(1).getValueType() ||
2141 !TLI.isOperationLegalOrCustom(ISD::AND, IntVT) ||
2142 !TLI.isOperationLegalOrCustom(ISD::OR, IntVT))
2143 return SDValue();
2144
2145 // Heuristic check to determine whether vector should be expanded to integer
2146 // operations or unrolled to scalar operations.
2147 // 1. Scalable vector is never unrolled.
2148 // 2. Fixed vector is unrolled if one of followings is true:
2149 // a. Vector only has 1 element and target knows how to handle scalar
2150 // FCOPYSIGN(either legal or custom expand or promote).
2151 // b. Vector has more than 1 element and target supports scalar
2152 // FCOPYSIGN natively and vector length <= 5(2 AND + 1 OR + 2 CONST).
2153 // FIXME: Scalar construction instruction count varies in every architecture,
2154 // here we assume 1 instruction for now.
2155 if (VT.isFixedLengthVector()) {
2156 EVT EltVT = VT.getVectorElementType();
2157 unsigned NumElts = VT.getVectorNumElements();
2158 if ((NumElts == 1 &&
2160 (NumElts < 6 && TLI.isOperationLegal(ISD::FCOPYSIGN, EltVT) &&
2161 TLI.isExtractVecEltCheap(VT, 0) &&
2162 (NumElts == 1 || TLI.isExtractVecEltCheap(VT, 1))))
2163 return SDValue();
2164 }
2165
2166 SDLoc DL(Node);
2167 SDValue Mag = DAG.getNode(ISD::BITCAST, DL, IntVT, Node->getOperand(0));
2168 SDValue Sign = DAG.getNode(ISD::BITCAST, DL, IntVT, Node->getOperand(1));
2169
2170 SDValue SignMask = DAG.getConstant(
2171 APInt::getSignMask(IntVT.getScalarSizeInBits()), DL, IntVT);
2172 SDValue SignBit = DAG.getNode(ISD::AND, DL, IntVT, Sign, SignMask);
2173
2174 SDValue ClearSignMask = DAG.getConstant(
2176 SDValue ClearedSign = DAG.getNode(ISD::AND, DL, IntVT, Mag, ClearSignMask);
2177
2178 SDValue CopiedSign = DAG.getNode(ISD::OR, DL, IntVT, ClearedSign, SignBit,
2180
2181 return DAG.getNode(ISD::BITCAST, DL, VT, CopiedSign);
2182}
2183
2184void VectorLegalizer::ExpandFSUB(SDNode *Node,
2185 SmallVectorImpl<SDValue> &Results) {
2186 // For floating-point values, (a-b) is the same as a+(-b). If FNEG is legal,
2187 // we can defer this to operation legalization where it will be lowered as
2188 // a+(-b).
2189 EVT VT = Node->getValueType(0);
2190 if (TLI.isOperationLegalOrCustom(ISD::FNEG, VT) &&
2192 return; // Defer to LegalizeDAG
2193
2194 if (SDValue Expanded = TLI.expandVectorNaryOpBySplitting(Node, DAG)) {
2195 Results.push_back(Expanded);
2196 return;
2197 }
2198
2199 SDValue Tmp = DAG.UnrollVectorOp(Node);
2200 Results.push_back(Tmp);
2201}
2202
2203void VectorLegalizer::ExpandSETCC(SDNode *Node,
2204 SmallVectorImpl<SDValue> &Results) {
2205 bool NeedInvert = false;
2206 bool IsVP = Node->getOpcode() == ISD::VP_SETCC;
2207 bool IsStrict = Node->getOpcode() == ISD::STRICT_FSETCC ||
2208 Node->getOpcode() == ISD::STRICT_FSETCCS;
2209 bool IsSignaling = Node->getOpcode() == ISD::STRICT_FSETCCS;
2210 unsigned Offset = IsStrict ? 1 : 0;
2211
2212 SDValue Chain = IsStrict ? Node->getOperand(0) : SDValue();
2213 SDValue LHS = Node->getOperand(0 + Offset);
2214 SDValue RHS = Node->getOperand(1 + Offset);
2215 SDValue CC = Node->getOperand(2 + Offset);
2216
2217 MVT OpVT = LHS.getSimpleValueType();
2218 ISD::CondCode CCCode = cast<CondCodeSDNode>(CC)->get();
2219
2220 if (TLI.getCondCodeAction(CCCode, OpVT) != TargetLowering::Expand) {
2221 if (IsStrict) {
2222 UnrollStrictFPOp(Node, Results);
2223 return;
2224 }
2225 Results.push_back(UnrollVSETCC(Node));
2226 return;
2227 }
2228
2229 SDValue Mask, EVL;
2230 if (IsVP) {
2231 Mask = Node->getOperand(3 + Offset);
2232 EVL = Node->getOperand(4 + Offset);
2233 }
2234
2235 SDLoc dl(Node);
2236 bool Legalized =
2237 TLI.LegalizeSetCCCondCode(DAG, Node->getValueType(0), LHS, RHS, CC, Mask,
2238 EVL, NeedInvert, dl, Chain, IsSignaling);
2239
2240 if (Legalized) {
2241 // If we expanded the SETCC by swapping LHS and RHS, or by inverting the
2242 // condition code, create a new SETCC node.
2243 if (CC.getNode()) {
2244 if (IsStrict) {
2245 LHS = DAG.getNode(Node->getOpcode(), dl, Node->getVTList(),
2246 {Chain, LHS, RHS, CC}, Node->getFlags());
2247 Chain = LHS.getValue(1);
2248 } else if (IsVP) {
2249 LHS = DAG.getNode(ISD::VP_SETCC, dl, Node->getValueType(0),
2250 {LHS, RHS, CC, Mask, EVL}, Node->getFlags());
2251 } else {
2252 LHS = DAG.getNode(ISD::SETCC, dl, Node->getValueType(0), LHS, RHS, CC,
2253 Node->getFlags());
2254 }
2255 }
2256
2257 // If we expanded the SETCC by inverting the condition code, then wrap
2258 // the existing SETCC in a NOT to restore the intended condition.
2259 if (NeedInvert) {
2260 if (!IsVP)
2261 LHS = DAG.getLogicalNOT(dl, LHS, LHS->getValueType(0));
2262 else
2263 LHS = DAG.getVPLogicalNOT(dl, LHS, Mask, EVL, LHS->getValueType(0));
2264 }
2265 } else {
2266 assert(!IsStrict && "Don't know how to expand for strict nodes.");
2267
2268 // Otherwise, SETCC for the given comparison type must be completely
2269 // illegal; expand it into a SELECT_CC.
2270 EVT VT = Node->getValueType(0);
2271 LHS = DAG.getNode(ISD::SELECT_CC, dl, VT, LHS, RHS,
2272 DAG.getBoolConstant(true, dl, VT, LHS.getValueType()),
2273 DAG.getBoolConstant(false, dl, VT, LHS.getValueType()),
2274 CC, Node->getFlags());
2275 }
2276
2277 Results.push_back(LHS);
2278 if (IsStrict)
2279 Results.push_back(Chain);
2280}
2281
2282void VectorLegalizer::ExpandUADDSUBO(SDNode *Node,
2283 SmallVectorImpl<SDValue> &Results) {
2284 SDValue Result, Overflow;
2285 TLI.expandUADDSUBO(Node, Result, Overflow, DAG);
2286 Results.push_back(Result);
2287 Results.push_back(Overflow);
2288}
2289
2290void VectorLegalizer::ExpandSADDSUBO(SDNode *Node,
2291 SmallVectorImpl<SDValue> &Results) {
2292 SDValue Result, Overflow;
2293 TLI.expandSADDSUBO(Node, Result, Overflow, DAG);
2294 Results.push_back(Result);
2295 Results.push_back(Overflow);
2296}
2297
2298void VectorLegalizer::ExpandMULO(SDNode *Node,
2299 SmallVectorImpl<SDValue> &Results) {
2300 SDValue Result, Overflow;
2301 if (!TLI.expandMULO(Node, Result, Overflow, DAG))
2302 std::tie(Result, Overflow) = DAG.UnrollVectorOverflowOp(Node);
2303
2304 Results.push_back(Result);
2305 Results.push_back(Overflow);
2306}
2307
2308void VectorLegalizer::ExpandFixedPointDiv(SDNode *Node,
2309 SmallVectorImpl<SDValue> &Results) {
2310 SDNode *N = Node;
2311 if (SDValue Expanded = TLI.expandFixedPointDiv(N->getOpcode(), SDLoc(N),
2312 N->getOperand(0), N->getOperand(1), N->getConstantOperandVal(2), DAG))
2313 Results.push_back(Expanded);
2314}
2315
2316void VectorLegalizer::ExpandStrictFPOp(SDNode *Node,
2317 SmallVectorImpl<SDValue> &Results) {
2318 if (Node->getOpcode() == ISD::STRICT_UINT_TO_FP) {
2319 ExpandUINT_TO_FLOAT(Node, Results);
2320 return;
2321 }
2322 if (Node->getOpcode() == ISD::STRICT_FP_TO_UINT) {
2323 ExpandFP_TO_UINT(Node, Results);
2324 return;
2325 }
2326
2327 if (Node->getOpcode() == ISD::STRICT_FSETCC ||
2328 Node->getOpcode() == ISD::STRICT_FSETCCS) {
2329 ExpandSETCC(Node, Results);
2330 return;
2331 }
2332
2333 UnrollStrictFPOp(Node, Results);
2334}
2335
2336void VectorLegalizer::ExpandREM(SDNode *Node,
2337 SmallVectorImpl<SDValue> &Results) {
2338 assert((Node->getOpcode() == ISD::SREM || Node->getOpcode() == ISD::UREM) &&
2339 "Expected REM node");
2340
2342 if (!TLI.expandREM(Node, Result, DAG))
2343 Result = DAG.UnrollVectorOp(Node);
2344 Results.push_back(Result);
2345}
2346
2347// Try to expand libm nodes into vector math routine calls. Callers provide the
2348// LibFunc equivalent of the passed in Node, which is used to lookup mappings
2349// within TargetLibraryInfo. The only mappings considered are those where the
2350// result and all operands are the same vector type. While predicated nodes are
2351// not supported, we will emit calls to masked routines by passing in an all
2352// true mask.
2353bool VectorLegalizer::tryExpandVecMathCall(SDNode *Node, RTLIB::Libcall LC,
2354 SmallVectorImpl<SDValue> &Results) {
2355 // Chain must be propagated but currently strict fp operations are down
2356 // converted to their none strict counterpart.
2357 assert(!Node->isStrictFPOpcode() && "Unexpected strict fp operation!");
2358
2359 RTLIB::LibcallImpl LCImpl = DAG.getLibcalls().getLibcallImpl(LC);
2360 if (LCImpl == RTLIB::Unsupported)
2361 return false;
2362
2363 EVT VT = Node->getValueType(0);
2364 const RTLIB::RuntimeLibcallsInfo &RTLCI = TLI.getRuntimeLibcallsInfo();
2365 LLVMContext &Ctx = *DAG.getContext();
2366
2367 auto [FuncTy, FuncAttrs] = RTLCI.getFunctionTy(
2368 Ctx, DAG.getSubtarget().getTargetTriple(), DAG.getDataLayout(), LCImpl);
2369
2370 SDLoc DL(Node);
2371 TargetLowering::ArgListTy Args;
2372
2373 bool HasMaskArg = RTLCI.hasVectorMaskArgument(LCImpl);
2374
2375 // Sanity check just in case function has unexpected parameters.
2376 assert(FuncTy->getNumParams() == Node->getNumOperands() + HasMaskArg &&
2377 EVT::getEVT(FuncTy->getReturnType(), true) == VT &&
2378 "mismatch in value type and call signature type");
2379
2380 for (unsigned I = 0, E = FuncTy->getNumParams(); I != E; ++I) {
2381 Type *ParamTy = FuncTy->getParamType(I);
2382
2383 if (HasMaskArg && I == E - 1) {
2384 assert(cast<VectorType>(ParamTy)->getElementType()->isIntegerTy(1) &&
2385 "unexpected vector mask type");
2386 EVT MaskVT = TLI.getSetCCResultType(DAG.getDataLayout(), Ctx, VT);
2387 Args.emplace_back(DAG.getBoolConstant(true, DL, MaskVT, VT),
2388 MaskVT.getTypeForEVT(Ctx));
2389
2390 } else {
2391 SDValue Op = Node->getOperand(I);
2392 assert(Op.getValueType() == EVT::getEVT(ParamTy, true) &&
2393 "mismatch in value type and call argument type");
2394 Args.emplace_back(Op, ParamTy);
2395 }
2396 }
2397
2398 // Emit a call to the vector function.
2399 SDValue Callee =
2400 DAG.getExternalSymbol(LCImpl, TLI.getPointerTy(DAG.getDataLayout()));
2401 CallingConv::ID CC = RTLCI.getLibcallImplCallingConv(LCImpl);
2402
2403 TargetLowering::CallLoweringInfo CLI(DAG);
2404 CLI.setDebugLoc(DL)
2405 .setChain(DAG.getEntryNode())
2406 .setLibCallee(CC, FuncTy->getReturnType(), Callee, std::move(Args));
2407
2408 std::pair<SDValue, SDValue> CallResult = TLI.LowerCallTo(CLI);
2409 Results.push_back(CallResult.first);
2410 return true;
2411}
2412
2413void VectorLegalizer::UnrollStrictFPOp(SDNode *Node,
2414 SmallVectorImpl<SDValue> &Results) {
2415 EVT VT = Node->getValueType(0);
2416 EVT EltVT = VT.getVectorElementType();
2417 unsigned NumElems = VT.getVectorNumElements();
2418 unsigned NumOpers = Node->getNumOperands();
2419 const TargetLowering &TLI = DAG.getTargetLoweringInfo();
2420
2421 EVT TmpEltVT = EltVT;
2422 if (Node->getOpcode() == ISD::STRICT_FSETCC ||
2423 Node->getOpcode() == ISD::STRICT_FSETCCS)
2424 TmpEltVT = TLI.getSetCCResultType(DAG.getDataLayout(),
2425 *DAG.getContext(), TmpEltVT);
2426
2427 EVT ValueVTs[] = {TmpEltVT, MVT::Other};
2428 SDValue Chain = Node->getOperand(0);
2429 SDLoc dl(Node);
2430
2431 SmallVector<SDValue, 32> OpValues;
2432 SmallVector<SDValue, 32> OpChains;
2433 for (unsigned i = 0; i < NumElems; ++i) {
2435 SDValue Idx = DAG.getVectorIdxConstant(i, dl);
2436
2437 // The Chain is the first operand.
2438 Opers.push_back(Chain);
2439
2440 // Now process the remaining operands.
2441 for (unsigned j = 1; j < NumOpers; ++j) {
2442 SDValue Oper = Node->getOperand(j);
2443 EVT OperVT = Oper.getValueType();
2444
2445 if (OperVT.isVector())
2446 Oper = DAG.getNode(ISD::EXTRACT_VECTOR_ELT, dl,
2447 OperVT.getVectorElementType(), Oper, Idx);
2448
2449 Opers.push_back(Oper);
2450 }
2451
2452 SDValue ScalarOp = DAG.getNode(Node->getOpcode(), dl, ValueVTs, Opers);
2453 SDValue ScalarResult = ScalarOp.getValue(0);
2454 SDValue ScalarChain = ScalarOp.getValue(1);
2455
2456 if (Node->getOpcode() == ISD::STRICT_FSETCC ||
2457 Node->getOpcode() == ISD::STRICT_FSETCCS)
2458 ScalarResult = DAG.getSelect(dl, EltVT, ScalarResult,
2459 DAG.getAllOnesConstant(dl, EltVT),
2460 DAG.getConstant(0, dl, EltVT));
2461
2462 OpValues.push_back(ScalarResult);
2463 OpChains.push_back(ScalarChain);
2464 }
2465
2466 SDValue Result = DAG.getBuildVector(VT, dl, OpValues);
2467 SDValue NewChain = DAG.getNode(ISD::TokenFactor, dl, MVT::Other, OpChains);
2468
2469 Results.push_back(Result);
2470 Results.push_back(NewChain);
2471}
2472
2473SDValue VectorLegalizer::UnrollVSETCC(SDNode *Node) {
2474 EVT VT = Node->getValueType(0);
2475 unsigned NumElems = VT.getVectorNumElements();
2476 EVT EltVT = VT.getVectorElementType();
2477 SDValue LHS = Node->getOperand(0);
2478 SDValue RHS = Node->getOperand(1);
2479 SDValue CC = Node->getOperand(2);
2480 EVT TmpEltVT = LHS.getValueType().getVectorElementType();
2481 SDLoc dl(Node);
2482 SmallVector<SDValue, 8> Ops(NumElems);
2483 for (unsigned i = 0; i < NumElems; ++i) {
2484 SDValue LHSElem = DAG.getNode(ISD::EXTRACT_VECTOR_ELT, dl, TmpEltVT, LHS,
2485 DAG.getVectorIdxConstant(i, dl));
2486 SDValue RHSElem = DAG.getNode(ISD::EXTRACT_VECTOR_ELT, dl, TmpEltVT, RHS,
2487 DAG.getVectorIdxConstant(i, dl));
2488 // FIXME: We should use i1 setcc + boolext here, but it causes regressions.
2489 Ops[i] = DAG.getNode(ISD::SETCC, dl,
2491 *DAG.getContext(), TmpEltVT),
2492 LHSElem, RHSElem, CC);
2493 Ops[i] = DAG.getSelect(dl, EltVT, Ops[i],
2494 DAG.getBoolConstant(true, dl, EltVT, VT),
2495 DAG.getConstant(0, dl, EltVT));
2496 }
2497 return DAG.getBuildVector(VT, dl, Ops);
2498}
2499
2501 return VectorLegalizer(*this).Run();
2502}
return SDValue()
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
Function Alias Analysis Results
static GCRegistry::Add< CoreCLRGC > E("coreclr", "CoreCLR-compatible GC")
This file defines the DenseMap class.
const AbstractManglingParser< Derived, Alloc >::OperatorInfo AbstractManglingParser< Derived, Alloc >::Ops[]
static void createBSWAPShuffleMask(EVT VT, SmallVectorImpl< int > &ShuffleMask)
#define I(x, y, z)
Definition MD5.cpp:57
#define T
This file defines the SmallVector class.
#define LLVM_DEBUG(...)
Definition Debug.h:119
This file describes how to lower LLVM code to machine code.
Value * RHS
Value * LHS
BinaryOperator * Mul
static APInt getSignMask(unsigned BitWidth)
Get the SignMask for a specific bit width.
Definition APInt.h:230
static APInt getSignedMaxValue(unsigned numBits)
Gets maximum signed value of APInt for a specific bit width.
Definition APInt.h:210
bool isBigEndian() const
Definition DataLayout.h:218
std::pair< iterator, bool > insert(const std::pair< KeyT, ValueT > &KV)
Definition DenseMap.h:239
size_t size() const
Definition Function.h:858
LLVM_ABI RTLIB::LibcallImpl getLibcallImpl(RTLIB::Libcall Call) const
Return the lowering's selection of implementation call for Call.
const Triple & getTargetTriple() const
unsigned getVectorNumElements() const
bool isVector() const
Return true if this is a vector value type.
TypeSize getSizeInBits() const
Returns the size of the specified MVT in bits.
MVT getVectorElementType() const
bool isFloatingPoint() const
Return true if this is a FP or a vector FP type.
MVT getScalarType() const
If this is a vector, return the element type, otherwise return this.
Represent a mutable reference to an array (0 or more elements consecutively in memory),...
Definition ArrayRef.h:294
Represents one node in the SelectionDAG.
unsigned getNumValues() const
Return the number of values defined/returned by this operator.
Unlike LLVM values, Selection DAG nodes may return multiple values as the result of a computation.
SDNode * getNode() const
get the SDNode which holds the desired result
SDValue getValue(unsigned R) const
EVT getValueType() const
Return the ValueType of the referenced return value.
TypeSize getValueSizeInBits() const
Returns the size of the value in bits.
This is used to represent a portion of an LLVM function in a low-level Data Dependence DAG representa...
const SDValue & getRoot() const
Return the root tag of the SelectionDAG.
const TargetSubtargetInfo & getSubtarget() const
LLVM_ABI SDVTList getVTList(EVT VT)
Return an SDVTList that represents the list of values specified.
LLVM_ABI SDValue getAllOnesConstant(const SDLoc &DL, EVT VT, bool IsTarget=false, bool IsOpaque=false)
LLVM_ABI bool LegalizeVectors()
This transforms the SelectionDAG into a SelectionDAG that only uses vector math operations supported ...
LLVM_ABI SDValue UnrollVectorOp(SDNode *N, unsigned ResNE=0)
Utility function used by legalize and lowering to "unroll" a vector operation by splitting out the sc...
LLVM_ABI SDValue getConstantFP(double Val, const SDLoc &DL, EVT VT, bool isTarget=false)
Create a ConstantFPSDNode wrapping a constant value.
SDValue getInsertSubvector(const SDLoc &DL, SDValue Vec, SDValue SubVec, unsigned Idx)
Insert SubVec at the Idx element of Vec.
LLVM_ABI SDValue getStepVector(const SDLoc &DL, EVT ResVT, const APInt &StepVal)
Returns a vector of type ResVT whose elements contain the linear sequence <0, Step,...
SDValue getSetCC(const SDLoc &DL, EVT VT, SDValue LHS, SDValue RHS, ISD::CondCode Cond, SDValue Chain=SDValue(), bool IsSignaling=false, SDNodeFlags Flags={})
Helper function to make it easier to build SetCC's if you just have an ISD::CondCode instead of an SD...
LLVM_ABI SDValue getNOT(const SDLoc &DL, SDValue Val, EVT VT)
Create a bitwise NOT operation as (XOR Val, -1).
const TargetLowering & getTargetLoweringInfo() const
LLVM_ABI std::pair< SDValue, SDValue > UnrollVectorOverflowOp(SDNode *N, unsigned ResNE=0)
Like UnrollVectorOp(), but for the [US](ADD|SUB|MUL)O family of opcodes.
allnodes_const_iterator allnodes_begin() const
SDValue getUNDEF(EVT VT)
Return an UNDEF node. UNDEF does not have a useful SDLoc.
SDValue getBuildVector(EVT VT, const SDLoc &DL, ArrayRef< SDValue > Ops)
Return an ISD::BUILD_VECTOR node.
allnodes_const_iterator allnodes_end() const
LLVM_ABI SDValue getBitcast(EVT VT, SDValue V)
Return a bitcast using the SDLoc of the value operand, and casting to the provided type.
SDValue getSelect(const SDLoc &DL, EVT VT, SDValue Cond, SDValue LHS, SDValue RHS, SDNodeFlags Flags=SDNodeFlags())
Helper function to make it easier to build Select's if you just have operands and don't want to check...
const DataLayout & getDataLayout() const
LLVM_ABI SDValue getConstant(uint64_t Val, const SDLoc &DL, EVT VT, bool isTarget=false, bool isOpaque=false)
Create a ConstantSDNode wrapping a constant value.
LLVM_ABI void RemoveDeadNodes()
This method deletes all unreachable nodes in the SelectionDAG.
LLVM_ABI SDValue getExternalSymbol(const char *Sym, EVT VT)
LLVM_ABI SDValue getVPLogicalNOT(const SDLoc &DL, SDValue Val, SDValue Mask, SDValue EVL, EVT VT)
Create a vector-predicated logical NOT operation as (VP_XOR Val, BooleanOne, Mask,...
const LibcallLoweringInfo & getLibcalls() const
LLVM_ABI SDValue getIntPtrConstant(uint64_t Val, const SDLoc &DL, bool isTarget=false)
LLVM_ABI SDValue getValueType(EVT)
LLVM_ABI SDValue getNode(unsigned Opcode, const SDLoc &DL, EVT VT, ArrayRef< SDUse > Ops)
Gets or creates the specified node.
LLVM_ABI unsigned AssignTopologicalOrder()
Topological-sort the AllNodes list and a assign a unique node id for each node in the DAG based on th...
LLVM_ABI SDValue getBoolConstant(bool V, const SDLoc &DL, EVT VT, EVT OpVT)
Create a true or false constant of type VT using the target's BooleanContent for type OpVT.
LLVM_ABI SDValue getVectorIdxConstant(uint64_t Val, const SDLoc &DL, bool isTarget=false)
SDValue getPOISON(EVT VT)
Return a POISON node. POISON does not have a useful SDLoc.
LLVMContext * getContext() const
const SDValue & setRoot(SDValue N)
Set the current root tag of the SelectionDAG.
LLVM_ABI SDNode * UpdateNodeOperands(SDNode *N, SDValue Op)
Mutate the specified node in-place to have the specified operands.
SDValue getEntryNode() const
Return the token chain corresponding to the entry of the function.
SDValue getSplat(EVT VT, const SDLoc &DL, SDValue Op)
Returns a node representing a splat of one value into all lanes of the provided vector type.
LLVM_ABI SDValue getVectorShuffle(EVT VT, const SDLoc &dl, SDValue N1, SDValue N2, ArrayRef< int > Mask)
Return an ISD::VECTOR_SHUFFLE node.
LLVM_ABI SDValue getLogicalNOT(const SDLoc &DL, SDValue Val, EVT VT)
Create a logical NOT operation as (XOR Val, BooleanOne).
ilist< SDNode >::iterator allnodes_iterator
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
void resize(size_type N)
void push_back(const T &Elt)
virtual bool isShuffleMaskLegal(ArrayRef< int >, EVT) const
Targets can use this to indicate that they only support some VECTOR_SHUFFLE operations,...
SDValue promoteTargetBoolean(SelectionDAG &DAG, SDValue Bool, EVT ValVT) const
Promote the given target boolean to a target boolean of the given type.
LegalizeAction getCondCodeAction(ISD::CondCode CC, MVT VT) const
Return how the condition code should be treated: either it is legal, needs to be expanded to some oth...
LegalizeAction getTruncStoreAction(EVT ValVT, EVT MemVT, Align Alignment, unsigned AddrSpace) const
Return how this store with truncation should be treated: either it is legal, needs to be promoted to ...
virtual bool isExtractVecEltCheap(EVT VT, unsigned Index) const
Return true if extraction of a scalar element from the given vector type at the given index is cheap.
LegalizeAction getFixedPointOperationAction(unsigned Op, EVT VT, unsigned Scale) const
Some fixed point operations may be natively supported by the target but only for specific scales.
bool isStrictFPEnabled() const
Return true if the target support strict float operation.
virtual EVT getSetCCResultType(const DataLayout &DL, LLVMContext &Context, EVT VT) const
Return the ValueType of the result of SETCC operations.
BooleanContent getBooleanContents(bool isVec, bool isFloat) const
For targets without i1 registers, this gives the nature of the high-bits of boolean values held in ty...
virtual MVT getPointerTy(const DataLayout &DL, uint32_t AS=0) const
Return the pointer type for the given address space, defaults to the pointer type from the data layou...
bool isOperationLegal(unsigned Op, EVT VT) const
Return true if the specified operation is legal on this target.
bool isOperationLegalOrCustom(unsigned Op, EVT VT, bool LegalOnly=false) const
Return true if the specified operation is legal on this target or can be made legal with custom lower...
LegalizeAction getPartialReduceMLAAction(unsigned Opc, EVT AccVT, EVT InputVT) const
Return how a PARTIAL_REDUCE_U/SMLA node with Acc type AccVT and Input type InputVT should be treated.
LegalizeAction getLoadAction(EVT ValVT, EVT MemVT, Align Alignment, unsigned AddrSpace, unsigned ExtType, bool Atomic) const
Return how this load with extension should be treated: either it is legal, needs to be promoted to a ...
LegalizeAction getStrictFPOperationAction(unsigned Op, EVT VT) const
LegalizeAction getOperationAction(unsigned Op, EVT VT) const
Return how this operation should be treated: either it is legal, needs to be promoted to a larger siz...
MVT getTypeToPromoteTo(unsigned Op, MVT VT) const
If the action for this operation is to promote, this method returns the ValueType to promote to.
bool isOperationLegalOrCustomOrPromote(unsigned Op, EVT VT, bool LegalOnly=false) const
Return true if the specified operation is legal on this target or can be made legal with custom lower...
const RTLIB::RuntimeLibcallsInfo & getRuntimeLibcallsInfo() const
This class defines information used to lower LLVM code to legal SelectionDAG operators that the targe...
SDValue expandAddSubSat(SDNode *Node, SelectionDAG &DAG) const
Method for building the DAG expansion of ISD::[US][ADD|SUB]SAT.
bool expandMultipleResultFPLibCall(SelectionDAG &DAG, RTLIB::Libcall LC, SDNode *Node, SmallVectorImpl< SDValue > &Results, std::optional< unsigned > CallRetResNo={}) const
Expands a node with multiple results to an FP or vector libcall.
SDValue expandVPCTLZ(SDNode *N, SelectionDAG &DAG) const
Expand VP_CTLZ/VP_CTLZ_ZERO_POISON nodes.
bool expandMULO(SDNode *Node, SDValue &Result, SDValue &Overflow, SelectionDAG &DAG) const
Method for building the DAG expansion of ISD::[US]MULO.
SDValue scalarizeVectorStore(StoreSDNode *ST, SelectionDAG &DAG) const
SDValue expandVPBSWAP(SDNode *N, SelectionDAG &DAG) const
Expand VP_BSWAP nodes.
SDValue expandVecReduceSeq(SDNode *Node, SelectionDAG &DAG) const
Expand a VECREDUCE_SEQ_* into an explicit ordered calculation.
SDValue expandFCANONICALIZE(SDNode *Node, SelectionDAG &DAG) const
Expand FCANONICALIZE to FMUL with 1.
SDValue expandCTLZ(SDNode *N, SelectionDAG &DAG) const
Expand CTLZ/CTLZ_ZERO_POISON nodes.
SDValue expandBITREVERSE(SDNode *N, SelectionDAG &DAG) const
Expand BITREVERSE nodes.
SDValue expandCTTZ(SDNode *N, SelectionDAG &DAG) const
Expand CTTZ/CTTZ_ZERO_POISON nodes.
SDValue expandABD(SDNode *N, SelectionDAG &DAG) const
Expand ABDS/ABDU nodes.
SDValue expandCLMUL(SDNode *N, SelectionDAG &DAG) const
Expand carryless multiply.
SDValue expandShlSat(SDNode *Node, SelectionDAG &DAG) const
Method for building the DAG expansion of ISD::[US]SHLSAT.
SDValue expandFP_TO_INT_SAT(SDNode *N, SelectionDAG &DAG) const
Expand FP_TO_[US]INT_SAT into FP_TO_[US]INT and selects or min/max.
SDValue expandCttzElts(SDNode *Node, SelectionDAG &DAG) const
Expand a CTTZ_ELTS or CTTZ_ELTS_ZERO_POISON by calculating (VL - i) for each active lane (i),...
void expandSADDSUBO(SDNode *Node, SDValue &Result, SDValue &Overflow, SelectionDAG &DAG) const
Method for building the DAG expansion of ISD::S(ADD|SUB)O.
SDValue expandVPBITREVERSE(SDNode *N, SelectionDAG &DAG) const
Expand VP_BITREVERSE nodes.
SDValue expandABS(SDNode *N, SelectionDAG &DAG, bool IsNegative=false) const
Expand ABS nodes.
SDValue expandVecReduce(SDNode *Node, SelectionDAG &DAG) const
Expand a VECREDUCE_* into an explicit calculation.
bool expandFP_TO_UINT(SDNode *N, SDValue &Result, SDValue &Chain, SelectionDAG &DAG) const
Expand float to UINT conversion.
bool expandREM(SDNode *Node, SDValue &Result, SelectionDAG &DAG) const
Expand an SREM or UREM using SDIV/UDIV or SDIVREM/UDIVREM, if legal.
SDValue expandFMINIMUMNUM_FMAXIMUMNUM(SDNode *N, SelectionDAG &DAG) const
Expand fminimumnum/fmaximumnum into multiple comparison with selects.
SDValue expandLoopDependenceMask(SDNode *N, SelectionDAG &DAG) const
Expand LOOP_DEPENDENCE_MASK nodes.
SDValue expandCTPOP(SDNode *N, SelectionDAG &DAG) const
Expand CTPOP nodes.
SDValue expandVectorNaryOpBySplitting(SDNode *Node, SelectionDAG &DAG) const
std::pair< SDValue, SDValue > LowerCallTo(CallLoweringInfo &CLI) const
This function lowers an abstract call to a function into an actual call.
SDValue expandBSWAP(SDNode *N, SelectionDAG &DAG) const
Expand BSWAP nodes.
SDValue expandFMINIMUM_FMAXIMUM(SDNode *N, SelectionDAG &DAG) const
Expand fminimum/fmaximum into multiple comparison with selects.
std::pair< SDValue, SDValue > scalarizeVectorLoad(LoadSDNode *LD, SelectionDAG &DAG) const
Turn load of vector type into a load of the individual elements.
SDValue expandFunnelShift(SDNode *N, SelectionDAG &DAG) const
Expand funnel shift.
bool LegalizeSetCCCondCode(SelectionDAG &DAG, EVT VT, SDValue &LHS, SDValue &RHS, SDValue &CC, SDValue Mask, SDValue EVL, bool &NeedInvert, const SDLoc &dl, SDValue &Chain, bool IsSignaling=false) const
Legalize a SETCC or VP_SETCC with given LHS and RHS and condition code CC on the current target.
virtual SDValue LowerOperation(SDValue Op, SelectionDAG &DAG) const
This callback is invoked for operations that are unsupported by the target, which are registered to u...
SDValue expandVPCTPOP(SDNode *N, SelectionDAG &DAG) const
Expand VP_CTPOP nodes.
SDValue expandFixedPointDiv(unsigned Opcode, const SDLoc &dl, SDValue LHS, SDValue RHS, unsigned Scale, SelectionDAG &DAG) const
Method for building the DAG expansion of ISD::[US]DIVFIX[SAT].
SDValue expandVPCTTZ(SDNode *N, SelectionDAG &DAG) const
Expand VP_CTTZ/VP_CTTZ_ZERO_POISON nodes.
SDValue expandVECTOR_COMPRESS(SDNode *Node, SelectionDAG &DAG) const
Expand a vector VECTOR_COMPRESS into a sequence of extract element, store temporarily,...
SDValue expandCONVERT_FROM_ARBITRARY_FP(SDNode *Node, SelectionDAG &DAG) const
Expand CONVERT_FROM_ARBITRARY_FP using bit manipulation.
SDValue expandROT(SDNode *N, bool AllowVectorOps, SelectionDAG &DAG) const
Expand rotations.
SDValue expandFMINNUM_FMAXNUM(SDNode *N, SelectionDAG &DAG) const
Expand fminnum/fmaxnum into fminnum_ieee/fmaxnum_ieee with quieted inputs.
SDValue expandCMP(SDNode *Node, SelectionDAG &DAG) const
Method for building the DAG expansion of ISD::[US]CMP.
SDValue expandFixedPointMul(SDNode *Node, SelectionDAG &DAG) const
Method for building the DAG expansion of ISD::[U|S]MULFIX[SAT].
SDValue expandIntMINMAX(SDNode *Node, SelectionDAG &DAG) const
Method for building the DAG expansion of ISD::[US][MIN|MAX].
SDValue expandVectorFindLastActive(SDNode *N, SelectionDAG &DAG) const
Expand VECTOR_FIND_LAST_ACTIVE nodes.
SDValue expandPartialReduceMLA(SDNode *Node, SelectionDAG &DAG) const
Expands PARTIAL_REDUCE_S/UMLA nodes to a series of simpler operations, consisting of zext/sext,...
void expandUADDSUBO(SDNode *Node, SDValue &Result, SDValue &Overflow, SelectionDAG &DAG) const
Method for building the DAG expansion of ISD::U(ADD|SUB)O.
bool expandUINT_TO_FP(SDNode *N, SDValue &Result, SDValue &Chain, SelectionDAG &DAG) const
Expand UINT(i64) to double(f64) conversion.
SDValue expandAVG(SDNode *N, SelectionDAG &DAG) const
Expand vector/scalar AVGCEILS/AVGCEILU/AVGFLOORS/AVGFLOORU nodes.
Changed
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
constexpr char Args[]
Key for Kernel::Metadata::mArgs.
constexpr std::underlying_type_t< E > Mask()
Get a bitmask with 1s in all places up to the high-order bit of E's largest value.
@ SETCC
SetCC operator - This evaluates to a true value iff the condition is true.
Definition ISDOpcodes.h:823
@ MERGE_VALUES
MERGE_VALUES - This node takes multiple discrete operands and returns them all as its individual resu...
Definition ISDOpcodes.h:261
@ STRICT_FSETCC
STRICT_FSETCC/STRICT_FSETCCS - Constrained versions of SETCC, used for floating-point operands only.
Definition ISDOpcodes.h:511
@ PARTIAL_REDUCE_SMLA
PARTIAL_REDUCE_[U|S]MLA(Accumulator, Input1, Input2) The partial reduction nodes sign or zero extend ...
@ LOOP_DEPENDENCE_RAW_MASK
@ VECREDUCE_SEQ_FADD
Generic reduction nodes.
@ SMUL_LOHI
SMUL_LOHI/UMUL_LOHI - Multiply two integers of type iN, producing a signed/unsigned value of type i[2...
Definition ISDOpcodes.h:275
@ BSWAP
Byte Swap and Counting operators.
Definition ISDOpcodes.h:783
@ SMULFIX
RESULT = [US]MULFIX(LHS, RHS, SCALE) - Perform fixed point multiplication on 2 integers with the same...
Definition ISDOpcodes.h:394
@ ADD
Simple integer binary arithmetic operators.
Definition ISDOpcodes.h:264
@ LOAD
LOAD and STORE have token chains as their first operand, then the same operands as an LLVM load/store...
@ SMULFIXSAT
Same as the corresponding unsaturated fixed point instructions, but the result is clamped between the...
Definition ISDOpcodes.h:400
@ ANY_EXTEND
ANY_EXTEND - Used for integer types. The high bits are undefined.
Definition ISDOpcodes.h:857
@ CTTZ_ELTS
Returns the number of number of trailing (least significant) zero elements in a vector.
@ FMA
FMA - Perform a * b + c with no intermediate rounding step.
Definition ISDOpcodes.h:518
@ VECTOR_FIND_LAST_ACTIVE
Finds the index of the last active mask element Operands: Mask.
@ FMODF
FMODF - Decomposes the operand into integral and fractional parts, each having the same type and sign...
@ FATAN2
FATAN2 - atan2, inspired by libm.
@ FSINCOSPI
FSINCOSPI - Compute both the sine and cosine times pi more accurately than FSINCOS(pi*x),...
@ SINT_TO_FP
[SU]INT_TO_FP - These operators convert integers (whose interpreted sign depends on the first letter)...
Definition ISDOpcodes.h:884
@ VECREDUCE_FMAX
FMIN/FMAX nodes can have flags, for NaN/NoNaN variants.
@ FADD
Simple binary floating point operators.
Definition ISDOpcodes.h:417
@ VECREDUCE_FMAXIMUM
FMINIMUM/FMAXIMUM nodes propatate NaNs and signed zeroes using the llvm.minimum and llvm....
@ ABS
ABS - Determine the unsigned absolute value of a signed integer value of the same bitwidth.
Definition ISDOpcodes.h:747
@ SIGN_EXTEND_VECTOR_INREG
SIGN_EXTEND_VECTOR_INREG(Vector) - This operator represents an in-register sign-extension of the low ...
Definition ISDOpcodes.h:914
@ SDIVREM
SDIVREM/UDIVREM - Divide two integers and produce both a quotient and remainder result.
Definition ISDOpcodes.h:280
@ FPTRUNC_ROUND
FPTRUNC_ROUND - This corresponds to the fptrunc_round intrinsic.
Definition ISDOpcodes.h:515
@ BITCAST
BITCAST - This operator converts between integer, vector and FP values, as if the value was stored to...
Definition ISDOpcodes.h:997
@ CLMUL
Carry-less multiplication operations.
Definition ISDOpcodes.h:778
@ FLDEXP
FLDEXP - ldexp, inspired by libm (op0 * 2**op1).
@ SDIVFIX
RESULT = [US]DIVFIX(LHS, RHS, SCALE) - Perform fixed point division on 2 integers with the same width...
Definition ISDOpcodes.h:407
@ STRICT_FSQRT
Constrained versions of libm-equivalent floating point intrinsics.
Definition ISDOpcodes.h:438
@ CONVERT_FROM_ARBITRARY_FP
CONVERT_FROM_ARBITRARY_FP - This operator converts from an arbitrary floating-point represented as an...
@ CTLZ_ZERO_POISON
Definition ISDOpcodes.h:792
@ PARTIAL_REDUCE_UMLA
@ SIGN_EXTEND
Conversion operators.
Definition ISDOpcodes.h:848
@ AVGCEILS
AVGCEILS/AVGCEILU - Rounding averaging add - Add two integers using an integer of type i[N+2],...
Definition ISDOpcodes.h:715
@ STRICT_UINT_TO_FP
Definition ISDOpcodes.h:485
@ VECREDUCE_FADD
These reductions have relaxed evaluation order semantics, and have a single vector operand.
@ PARTIAL_REDUCE_FMLA
@ FSINCOS
FSINCOS - Compute both fsin and fcos as a single operation.
@ FNEG
Perform various unary floating-point operations inspired by libm.
@ SSUBO
Same for subtraction.
Definition ISDOpcodes.h:352
@ STEP_VECTOR
STEP_VECTOR(IMM) - Returns a scalable vector whose lanes are comprised of a linear sequence of unsign...
Definition ISDOpcodes.h:691
@ FCANONICALIZE
Returns platform specific canonical encoding of a floating point number.
Definition ISDOpcodes.h:541
@ SSUBSAT
RESULT = [US]SUBSAT(LHS, RHS) - Perform saturation subtraction on 2 integers with the same bit width ...
Definition ISDOpcodes.h:374
@ SELECT
Select(COND, TRUEVAL, FALSEVAL).
Definition ISDOpcodes.h:800
@ SPLAT_VECTOR
SPLAT_VECTOR(VAL) - Returns a vector with the scalar value VAL duplicated in all lanes.
Definition ISDOpcodes.h:672
@ SADDO
RESULT, BOOL = [SU]ADDO(LHS, RHS) - Overflow-aware nodes for addition.
Definition ISDOpcodes.h:348
@ VECREDUCE_ADD
Integer reductions may have a result type larger than the vector element type.
@ MULHU
MULHU/MULHS - Multiply high - Multiply two integers of type iN, producing an unsigned/signed value of...
Definition ISDOpcodes.h:704
@ SHL
Shift and rotation operations.
Definition ISDOpcodes.h:769
@ FMINNUM_IEEE
FMINNUM_IEEE/FMAXNUM_IEEE - Perform floating-point minimumNumber or maximumNumber on two values,...
@ EXTRACT_VECTOR_ELT
EXTRACT_VECTOR_ELT(VECTOR, IDX) - Returns a single element from VECTOR identified by the (potentially...
Definition ISDOpcodes.h:576
@ ZERO_EXTEND
ZERO_EXTEND - Used for integer types, zeroing the new bits.
Definition ISDOpcodes.h:854
@ SELECT_CC
Select with condition operator - This selects between a true value and a false value (ops #2 and #3) ...
Definition ISDOpcodes.h:815
@ FMINNUM
FMINNUM/FMAXNUM - Perform floating-point minimum maximum on two values, following IEEE-754 definition...
@ SSHLSAT
RESULT = [US]SHLSAT(LHS, RHS) - Perform saturation left shift.
Definition ISDOpcodes.h:386
@ SMULO
Same for multiplication.
Definition ISDOpcodes.h:356
@ ANY_EXTEND_VECTOR_INREG
ANY_EXTEND_VECTOR_INREG(Vector) - This operator represents an in-register any-extension of the low la...
Definition ISDOpcodes.h:903
@ SIGN_EXTEND_INREG
SIGN_EXTEND_INREG - This operator atomically performs a SHL/SRA pair to sign extend a small value in ...
Definition ISDOpcodes.h:892
@ SMIN
[US]{MIN/MAX} - Binary minimum or maximum of signed or unsigned integers.
Definition ISDOpcodes.h:727
@ MASKED_UDIV
Masked vector arithmetic that returns poison on disabled lanes.
@ SDIVFIXSAT
Same as the corresponding unsaturated fixed point instructions, but the result is clamped between the...
Definition ISDOpcodes.h:413
@ FP_EXTEND
X = FP_EXTEND(Y) - Extend a smaller FP type into a larger FP type.
Definition ISDOpcodes.h:982
@ VSELECT
Select with a vector condition (op #0) and two vector operands (ops #1 and #2), returning a vector re...
Definition ISDOpcodes.h:809
@ STRICT_SINT_TO_FP
STRICT_[US]INT_TO_FP - Convert a signed or unsigned integer to a floating point value.
Definition ISDOpcodes.h:484
@ MGATHER
Masked gather and scatter - load and store operations for a vector of random addresses with additiona...
@ STRICT_FP_TO_UINT
Definition ISDOpcodes.h:478
@ STRICT_FP_ROUND
X = STRICT_FP_ROUND(Y, TRUNC) - Rounding 'Y' from a larger floating point type down to the precision ...
Definition ISDOpcodes.h:500
@ STRICT_FP_TO_SINT
STRICT_FP_TO_[US]INT - Convert a floating point value to a signed or unsigned integer.
Definition ISDOpcodes.h:477
@ FMINIMUM
FMINIMUM/FMAXIMUM - NaN-propagating minimum/maximum that also treat -0.0 as less than 0....
@ FP_TO_SINT
FP_TO_[US]INT - Convert a floating point value to a signed or unsigned integer.
Definition ISDOpcodes.h:930
@ STRICT_FP_EXTEND
X = STRICT_FP_EXTEND(Y) - Extend a smaller FP type into a larger FP type.
Definition ISDOpcodes.h:505
@ AND
Bitwise operators - logical and, logical or, logical xor.
Definition ISDOpcodes.h:739
@ SCMP
[US]CMP - 3-way comparison of signed or unsigned integers.
Definition ISDOpcodes.h:735
@ AVGFLOORS
AVGFLOORS/AVGFLOORU - Averaging add - Add two integers using an integer of type i[N+1],...
Definition ISDOpcodes.h:710
@ STRICT_FADD
Constrained versions of the binary floating point operators.
Definition ISDOpcodes.h:427
@ TokenFactor
TokenFactor - This node takes multiple tokens as input and produces a single token result.
Definition ISDOpcodes.h:53
@ CTTZ_ZERO_POISON
Bit counting operators with a poisoned result for zero inputs.
Definition ISDOpcodes.h:791
@ FFREXP
FFREXP - frexp, extract fractional and exponent component of a floating-point value.
@ FP_ROUND
X = FP_ROUND(Y, TRUNC) - Rounding 'Y' from a larger floating point type down to the precision of the ...
Definition ISDOpcodes.h:963
@ VECTOR_COMPRESS
VECTOR_COMPRESS(Vec, Mask, Passthru) consecutively place vector elements based on mask e....
Definition ISDOpcodes.h:699
@ ZERO_EXTEND_VECTOR_INREG
ZERO_EXTEND_VECTOR_INREG(Vector) - This operator represents an in-register zero-extension of the low ...
Definition ISDOpcodes.h:925
@ FP_TO_SINT_SAT
FP_TO_[US]INT_SAT - Convert floating point value in operand 0 to a signed or unsigned scalar integer ...
Definition ISDOpcodes.h:949
@ VECREDUCE_FMINIMUM
@ TRUNCATE
TRUNCATE - Completely drop the high bits.
Definition ISDOpcodes.h:860
@ VECREDUCE_SEQ_FMUL
@ AssertSext
AssertSext, AssertZext - These nodes record if a register contains a value that has already been zero...
Definition ISDOpcodes.h:62
@ FCOPYSIGN
FCOPYSIGN(X, Y) - Return the value of X with the sign of Y.
Definition ISDOpcodes.h:534
@ PARTIAL_REDUCE_SUMLA
@ SADDSAT
RESULT = [US]ADDSAT(LHS, RHS) - Perform saturation addition on 2 integers with the same bit width (W)...
Definition ISDOpcodes.h:365
@ CTTZ_ELTS_ZERO_POISON
@ FMINIMUMNUM
FMINIMUMNUM/FMAXIMUMNUM - minimumnum/maximumnum that is same with FMINNUM_IEEE and FMAXNUM_IEEE besid...
@ ABDS
ABDS/ABDU - Absolute difference - Return the absolute difference between two numbers interpreted as s...
Definition ISDOpcodes.h:722
@ ABS_MIN_POISON
ABS with a poison result for INT_MIN.
Definition ISDOpcodes.h:751
@ BUILD_VECTOR
BUILD_VECTOR(ELT0, ELT1, ELT2, ELT3,...) - Return a fixed-width vector with the specified,...
Definition ISDOpcodes.h:556
@ LOOP_DEPENDENCE_WAR_MASK
The llvm.loop.dependence.
LLVM_ABI NodeType getUnmaskedBinOpOpcode(unsigned MaskedOpc)
Given a MaskedOpc of ISD::MASKED_(U|S)(DIV|REM), returns the unmasked ISD::(U|S)(DIV|REM).
LLVM_ABI std::optional< unsigned > getVPMaskIdx(unsigned Opcode)
The operand position of the vector mask.
LLVM_ABI std::optional< unsigned > getVPExplicitVectorLengthIdx(unsigned Opcode)
The operand position of the explicit vector length parameter.
CondCode
ISD::CondCode enum - These are ordered carefully to make the bitfields below work out,...
LoadExtType
LoadExtType enum - This enum defines the three variants of LOADEXT (load with extension).
LLVM_ABI bool isVPOpcode(unsigned Opcode)
Whether this is a vector-predicated Opcode.
LLVM_ABI Libcall getREM(EVT VT)
LLVM_ABI Libcall getSINCOSPI(EVT RetVT)
getSINCOSPI - Return the SINCOSPI_* value for the given types, or UNKNOWN_LIBCALL if there is none.
LLVM_ABI Libcall getMODF(EVT VT)
getMODF - Return the MODF_* value for the given types, or UNKNOWN_LIBCALL if there is none.
LLVM_ABI Libcall getCBRT(EVT RetVT)
getCBRT - Return the CBRT_* value for the given types, or UNKNOWN_LIBCALL if there is none.
LLVM_ABI Libcall getPOW(EVT RetVT)
getPOW - Return the POW_* value for the given types, or UNKNOWN_LIBCALL if there is none.
LLVM_ABI Libcall getSINCOS(EVT RetVT)
getSINCOS - Return the SINCOS_* value for the given types, or UNKNOWN_LIBCALL if there is none.
NodeAddr< NodeBase * > Node
Definition RDFGraph.h:381
This is an optimization pass for GlobalISel generic memory operations.
@ Offset
Definition DWP.cpp:557
bool any_of(R &&range, UnaryPredicate P)
Provide wrappers to std::any_of which take ranges instead of having to pass begin/end explicitly.
Definition STLExtras.h:1745
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
Definition Debug.cpp:209
SmallVector< ValueTypeFromRangeType< R >, Size > to_vector(R &&Range)
Given a range of type R, iterate the entire range and return a SmallVector with elements of the vecto...
class LLVM_GSL_OWNER SmallVector
Forward declaration of SmallVector so that calculateSmallVectorDefaultInlinedElements can reference s...
MutableArrayRef(T &OneElt) -> MutableArrayRef< T >
@ Xor
Bitwise or logical XOR of integers.
DWARFExpression::Operation Op
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:559
auto seq(T Begin, T End)
Iterate over an integral type from Begin up to - but not including - End.
Definition Sequence.h:305
#define N
Extended Value Type.
Definition ValueTypes.h:35
EVT changeVectorElementTypeToInteger() const
Return a vector with the same number of elements as this vector, but with the element type converted ...
Definition ValueTypes.h:90
static EVT getVectorVT(LLVMContext &Context, EVT VT, unsigned NumElements, bool IsScalable=false)
Returns the EVT that represents a vector NumElements in length, where each element is of type VT.
Definition ValueTypes.h:70
ElementCount getVectorElementCount() const
Definition ValueTypes.h:358
TypeSize getSizeInBits() const
Return the size of the specified value type in bits.
Definition ValueTypes.h:381
uint64_t getScalarSizeInBits() const
Definition ValueTypes.h:393
static LLVM_ABI EVT getEVT(Type *Ty, bool HandleUnknown=false)
Return the value type corresponding to the specified type.
EVT changeVectorElementType(LLVMContext &Context, EVT EltVT) const
Return a VT for a vector type whose attributes match ourselves with the exception of the element type...
Definition ValueTypes.h:98
MVT getSimpleVT() const
Return the SimpleValueType held in the specified simple EVT.
Definition ValueTypes.h:324
bool isFixedLengthVector() const
Definition ValueTypes.h:189
bool isVector() const
Return true if this is a vector value type.
Definition ValueTypes.h:176
EVT getScalarType() const
If this is a vector type, return the element type, otherwise return this.
Definition ValueTypes.h:331
LLVM_ABI Type * getTypeForEVT(LLVMContext &Context) const
This method returns an LLVM type corresponding to the specified EVT.
bool isScalableVector() const
Return true if this is a vector type where the runtime length is machine dependent.
Definition ValueTypes.h:182
EVT getVectorElementType() const
Given a vector type, return the type of each element.
Definition ValueTypes.h:336
unsigned getVectorNumElements() const
Given a vector type, return the number of elements it contains.
Definition ValueTypes.h:344
bool bitsLE(EVT VT) const
Return true if this has no more bits than VT.
Definition ValueTypes.h:316
bool isInteger() const
Return true if this is an integer or a vector integer type.
Definition ValueTypes.h:160
CallingConv::ID getLibcallImplCallingConv(RTLIB::LibcallImpl Call) const
Get the CallingConv that should be used for the specified libcall.
std::pair< FunctionType *, AttributeList > getFunctionTy(LLVMContext &Ctx, const Triple &TT, const DataLayout &DL, RTLIB::LibcallImpl LibcallImpl) const
static bool hasVectorMaskArgument(RTLIB::LibcallImpl Impl)
Returns true if the function has a vector mask argument, which is assumed to be the last argument.