LLVM 23.0.0git
ConstantFolding.cpp
Go to the documentation of this file.
1//===-- ConstantFolding.cpp - Fold instructions into constants ------------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This file defines routines for folding instructions into constants.
10//
11// Also, to supplement the basic IR ConstantExpr simplifications,
12// this file defines some additional folding routines that can make use of
13// DataLayout information. These functions cannot go in IR due to library
14// dependency issues.
15//
16//===----------------------------------------------------------------------===//
17
19#include "llvm/ADT/APFloat.h"
20#include "llvm/ADT/APInt.h"
21#include "llvm/ADT/APSInt.h"
22#include "llvm/ADT/ArrayRef.h"
23#include "llvm/ADT/DenseMap.h"
24#include "llvm/ADT/STLExtras.h"
26#include "llvm/ADT/StringRef.h"
31#include "llvm/Config/config.h"
32#include "llvm/IR/Constant.h"
34#include "llvm/IR/Constants.h"
35#include "llvm/IR/DataLayout.h"
37#include "llvm/IR/Function.h"
38#include "llvm/IR/GlobalValue.h"
40#include "llvm/IR/InstrTypes.h"
41#include "llvm/IR/Instruction.h"
44#include "llvm/IR/Intrinsics.h"
45#include "llvm/IR/IntrinsicsAArch64.h"
46#include "llvm/IR/IntrinsicsAMDGPU.h"
47#include "llvm/IR/IntrinsicsARM.h"
48#include "llvm/IR/IntrinsicsNVPTX.h"
49#include "llvm/IR/IntrinsicsWebAssembly.h"
50#include "llvm/IR/IntrinsicsX86.h"
52#include "llvm/IR/Operator.h"
53#include "llvm/IR/Type.h"
54#include "llvm/IR/Value.h"
59#include <cassert>
60#include <cerrno>
61#include <cfenv>
62#include <cmath>
63#include <cstdint>
64
65using namespace llvm;
66
68 "disable-fp-call-folding",
69 cl::desc("Disable constant-folding of FP intrinsics and libcalls."),
70 cl::init(false), cl::Hidden);
71
72namespace {
73
74//===----------------------------------------------------------------------===//
75// Constant Folding internal helper functions
76//===----------------------------------------------------------------------===//
77
78static Constant *foldConstVectorToAPInt(APInt &Result, Type *DestTy,
79 Constant *C, Type *SrcEltTy,
80 unsigned NumSrcElts,
81 const DataLayout &DL) {
82 // Now that we know that the input value is a vector of integers, just shift
83 // and insert them into our result.
84 unsigned BitShift = DL.getTypeSizeInBits(SrcEltTy);
85 for (unsigned i = 0; i != NumSrcElts; ++i) {
86 Constant *Element;
87 if (DL.isLittleEndian())
88 Element = C->getAggregateElement(NumSrcElts - i - 1);
89 else
90 Element = C->getAggregateElement(i);
91
92 if (isa_and_nonnull<UndefValue>(Element)) {
93 Result <<= BitShift;
94 continue;
95 }
96
97 auto *ElementCI = dyn_cast_or_null<ConstantInt>(Element);
98 if (!ElementCI)
99 return ConstantExpr::getBitCast(C, DestTy);
100
101 Result <<= BitShift;
102 Result |= ElementCI->getValue().zext(Result.getBitWidth());
103 }
104
105 return nullptr;
106}
107
108/// Constant fold bitcast, symbolically evaluating it with DataLayout.
109/// This always returns a non-null constant, but it may be a
110/// ConstantExpr if unfoldable.
111Constant *FoldBitCast(Constant *C, Type *DestTy, const DataLayout &DL) {
112 assert(CastInst::castIsValid(Instruction::BitCast, C, DestTy) &&
113 "Invalid constantexpr bitcast!");
114
115 // Catch the obvious splat cases.
116 if (Constant *Res = ConstantFoldLoadFromUniformValue(C, DestTy, DL))
117 return Res;
118
119 if (auto *VTy = dyn_cast<VectorType>(C->getType())) {
120 // Handle a vector->scalar integer/fp cast.
121 if (isa<IntegerType>(DestTy) || DestTy->isFloatingPointTy()) {
122 unsigned NumSrcElts = cast<FixedVectorType>(VTy)->getNumElements();
123 Type *SrcEltTy = VTy->getElementType();
124
125 // If the vector is a vector of floating point, convert it to vector of int
126 // to simplify things.
127 if (SrcEltTy->isFloatingPointTy()) {
128 unsigned FPWidth = SrcEltTy->getPrimitiveSizeInBits();
129 auto *SrcIVTy = FixedVectorType::get(
130 IntegerType::get(C->getContext(), FPWidth), NumSrcElts);
131 // Ask IR to do the conversion now that #elts line up.
132 C = ConstantExpr::getBitCast(C, SrcIVTy);
133 }
134
135 APInt Result(DL.getTypeSizeInBits(DestTy), 0);
136 if (Constant *CE = foldConstVectorToAPInt(Result, DestTy, C,
137 SrcEltTy, NumSrcElts, DL))
138 return CE;
139
140 if (isa<IntegerType>(DestTy))
141 return ConstantInt::get(DestTy, Result);
142
143 APFloat FP(DestTy->getFltSemantics(), Result);
144 return ConstantFP::get(DestTy->getContext(), FP);
145 }
146 }
147
148 // The code below only handles casts to vectors currently.
149 auto *DestVTy = dyn_cast<VectorType>(DestTy);
150 if (!DestVTy)
151 return ConstantExpr::getBitCast(C, DestTy);
152
153 // If this is a scalar -> vector cast, convert the input into a <1 x scalar>
154 // vector so the code below can handle it uniformly.
155 if (!isa<VectorType>(C->getType()) &&
157 Constant *Ops = C; // don't take the address of C!
158 return FoldBitCast(ConstantVector::get(Ops), DestTy, DL);
159 }
160
161 // Some of what follows may extend to cover scalable vectors but the current
162 // implementation is fixed length specific.
163 if (!isa<FixedVectorType>(C->getType()))
164 return ConstantExpr::getBitCast(C, DestTy);
165
166 // If this is a bitcast from constant vector -> vector, fold it.
169 return ConstantExpr::getBitCast(C, DestTy);
170
171 // If the element types match, IR can fold it.
172 unsigned NumDstElt = cast<FixedVectorType>(DestVTy)->getNumElements();
173 unsigned NumSrcElt = cast<FixedVectorType>(C->getType())->getNumElements();
174 if (NumDstElt == NumSrcElt)
175 return ConstantExpr::getBitCast(C, DestTy);
176
177 Type *SrcEltTy = cast<VectorType>(C->getType())->getElementType();
178 Type *DstEltTy = DestVTy->getElementType();
179
180 // Otherwise, we're changing the number of elements in a vector, which
181 // requires endianness information to do the right thing. For example,
182 // bitcast (<2 x i64> <i64 0, i64 1> to <4 x i32>)
183 // folds to (little endian):
184 // <4 x i32> <i32 0, i32 0, i32 1, i32 0>
185 // and to (big endian):
186 // <4 x i32> <i32 0, i32 0, i32 0, i32 1>
187
188 // First thing is first. We only want to think about integer here, so if
189 // we have something in FP form, recast it as integer.
190 if (DstEltTy->isFloatingPointTy()) {
191 // Fold to an vector of integers with same size as our FP type.
192 unsigned FPWidth = DstEltTy->getPrimitiveSizeInBits();
193 auto *DestIVTy = FixedVectorType::get(
194 IntegerType::get(C->getContext(), FPWidth), NumDstElt);
195 // Recursively handle this integer conversion, if possible.
196 C = FoldBitCast(C, DestIVTy, DL);
197
198 // Finally, IR can handle this now that #elts line up.
199 return ConstantExpr::getBitCast(C, DestTy);
200 }
201
202 // Okay, we know the destination is integer, if the input is FP, convert
203 // it to integer first.
204 if (SrcEltTy->isFloatingPointTy()) {
205 unsigned FPWidth = SrcEltTy->getPrimitiveSizeInBits();
206 auto *SrcIVTy = FixedVectorType::get(
207 IntegerType::get(C->getContext(), FPWidth), NumSrcElt);
208 // Ask IR to do the conversion now that #elts line up.
209 C = ConstantExpr::getBitCast(C, SrcIVTy);
210 assert((isa<ConstantVector>(C) || // FIXME: Remove ConstantVector.
212 "Constant folding cannot fail for plain fp->int bitcast!");
213 }
214
215 // Now we know that the input and output vectors are both integer vectors
216 // of the same size, and that their #elements is not the same. Do the
217 // conversion here, which depends on whether the input or output has
218 // more elements.
219 bool isLittleEndian = DL.isLittleEndian();
220
222 if (NumDstElt < NumSrcElt) {
223 // Handle: bitcast (<4 x i32> <i32 0, i32 1, i32 2, i32 3> to <2 x i64>)
225 unsigned Ratio = NumSrcElt/NumDstElt;
226 unsigned SrcBitSize = SrcEltTy->getPrimitiveSizeInBits();
227 unsigned SrcElt = 0;
228 for (unsigned i = 0; i != NumDstElt; ++i) {
229 // Build each element of the result.
230 Constant *Elt = Zero;
231 unsigned ShiftAmt = isLittleEndian ? 0 : SrcBitSize*(Ratio-1);
232 for (unsigned j = 0; j != Ratio; ++j) {
233 Constant *Src = C->getAggregateElement(SrcElt++);
236 cast<VectorType>(C->getType())->getElementType());
237 else
239 if (!Src) // Reject constantexpr elements.
240 return ConstantExpr::getBitCast(C, DestTy);
241
242 // Zero extend the element to the right size.
243 Src = ConstantFoldCastOperand(Instruction::ZExt, Src, Elt->getType(),
244 DL);
245 assert(Src && "Constant folding cannot fail on plain integers");
246
247 // Shift it to the right place, depending on endianness.
249 Instruction::Shl, Src, ConstantInt::get(Src->getType(), ShiftAmt),
250 DL);
251 assert(Src && "Constant folding cannot fail on plain integers");
252
253 ShiftAmt += isLittleEndian ? SrcBitSize : -SrcBitSize;
254
255 // Mix it in.
256 Elt = ConstantFoldBinaryOpOperands(Instruction::Or, Elt, Src, DL);
257 assert(Elt && "Constant folding cannot fail on plain integers");
258 }
259 Result.push_back(Elt);
260 }
261 return ConstantVector::get(Result);
262 }
263
264 // Handle: bitcast (<2 x i64> <i64 0, i64 1> to <4 x i32>)
265 unsigned Ratio = NumDstElt/NumSrcElt;
266 unsigned DstBitSize = DL.getTypeSizeInBits(DstEltTy);
267
268 // Loop over each source value, expanding into multiple results.
269 for (unsigned i = 0; i != NumSrcElt; ++i) {
270 auto *Element = C->getAggregateElement(i);
271
272 if (!Element) // Reject constantexpr elements.
273 return ConstantExpr::getBitCast(C, DestTy);
274
275 if (isa<UndefValue>(Element)) {
276 // Correctly Propagate undef values.
277 Result.append(Ratio, UndefValue::get(DstEltTy));
278 continue;
279 }
280
281 auto *Src = dyn_cast<ConstantInt>(Element);
282 if (!Src)
283 return ConstantExpr::getBitCast(C, DestTy);
284
285 unsigned ShiftAmt = isLittleEndian ? 0 : DstBitSize*(Ratio-1);
286 for (unsigned j = 0; j != Ratio; ++j) {
287 // Shift the piece of the value into the right place, depending on
288 // endianness.
289 APInt Elt = Src->getValue().lshr(ShiftAmt);
290 ShiftAmt += isLittleEndian ? DstBitSize : -DstBitSize;
291
292 // Truncate and remember this piece.
293 Result.push_back(ConstantInt::get(DstEltTy, Elt.trunc(DstBitSize)));
294 }
295 }
296
297 return ConstantVector::get(Result);
298}
299
300} // end anonymous namespace
301
302/// If this constant is a constant offset from a global, return the global and
303/// the constant. Because of constantexprs, this function is recursive.
305 APInt &Offset, const DataLayout &DL,
306 DSOLocalEquivalent **DSOEquiv) {
307 if (DSOEquiv)
308 *DSOEquiv = nullptr;
309
310 // Trivial case, constant is the global.
311 if ((GV = dyn_cast<GlobalValue>(C))) {
312 unsigned BitWidth = DL.getIndexTypeSizeInBits(GV->getType());
313 Offset = APInt(BitWidth, 0);
314 return true;
315 }
316
317 if (auto *FoundDSOEquiv = dyn_cast<DSOLocalEquivalent>(C)) {
318 if (DSOEquiv)
319 *DSOEquiv = FoundDSOEquiv;
320 GV = FoundDSOEquiv->getGlobalValue();
321 unsigned BitWidth = DL.getIndexTypeSizeInBits(GV->getType());
322 Offset = APInt(BitWidth, 0);
323 return true;
324 }
325
326 // Otherwise, if this isn't a constant expr, bail out.
327 auto *CE = dyn_cast<ConstantExpr>(C);
328 if (!CE) return false;
329
330 // Look through ptr->int and ptr->ptr casts.
331 if (CE->getOpcode() == Instruction::PtrToInt ||
332 CE->getOpcode() == Instruction::PtrToAddr)
333 return IsConstantOffsetFromGlobal(CE->getOperand(0), GV, Offset, DL,
334 DSOEquiv);
335
336 // i32* getelementptr ([5 x i32]* @a, i32 0, i32 5)
337 auto *GEP = dyn_cast<GEPOperator>(CE);
338 if (!GEP)
339 return false;
340
341 unsigned BitWidth = DL.getIndexTypeSizeInBits(GEP->getType());
342 APInt TmpOffset(BitWidth, 0);
343
344 // If the base isn't a global+constant, we aren't either.
345 if (!IsConstantOffsetFromGlobal(CE->getOperand(0), GV, TmpOffset, DL,
346 DSOEquiv))
347 return false;
348
349 // Otherwise, add any offset that our operands provide.
350 if (!GEP->accumulateConstantOffset(DL, TmpOffset))
351 return false;
352
353 Offset = TmpOffset;
354 return true;
355}
356
358 const DataLayout &DL) {
359 do {
360 Type *SrcTy = C->getType();
361 if (SrcTy == DestTy)
362 return C;
363
364 TypeSize DestSize = DL.getTypeSizeInBits(DestTy);
365 TypeSize SrcSize = DL.getTypeSizeInBits(SrcTy);
366 if (!TypeSize::isKnownGE(SrcSize, DestSize))
367 return nullptr;
368
369 // Catch the obvious splat cases (since all-zeros can coerce non-integral
370 // pointers legally).
371 if (Constant *Res = ConstantFoldLoadFromUniformValue(C, DestTy, DL))
372 return Res;
373
374 // If the type sizes are the same and a cast is legal, just directly
375 // cast the constant.
376 // But be careful not to coerce non-integral pointers illegally.
377 if (SrcSize == DestSize &&
378 DL.isNonIntegralPointerType(SrcTy->getScalarType()) ==
379 DL.isNonIntegralPointerType(DestTy->getScalarType())) {
380 Instruction::CastOps Cast = Instruction::BitCast;
381 // If we are going from a pointer to int or vice versa, we spell the cast
382 // differently.
383 if (SrcTy->isIntegerTy() && DestTy->isPointerTy())
384 Cast = Instruction::IntToPtr;
385 else if (SrcTy->isPointerTy() && DestTy->isIntegerTy())
386 Cast = Instruction::PtrToInt;
387
388 if (CastInst::castIsValid(Cast, C, DestTy))
389 return ConstantFoldCastOperand(Cast, C, DestTy, DL);
390 }
391
392 // If this isn't an aggregate type, there is nothing we can do to drill down
393 // and find a bitcastable constant.
394 if (!SrcTy->isAggregateType() && !SrcTy->isVectorTy())
395 return nullptr;
396
397 // We're simulating a load through a pointer that was bitcast to point to
398 // a different type, so we can try to walk down through the initial
399 // elements of an aggregate to see if some part of the aggregate is
400 // castable to implement the "load" semantic model.
401 if (SrcTy->isStructTy()) {
402 // Struct types might have leading zero-length elements like [0 x i32],
403 // which are certainly not what we are looking for, so skip them.
404 unsigned Elem = 0;
405 Constant *ElemC;
406 do {
407 ElemC = C->getAggregateElement(Elem++);
408 } while (ElemC && DL.getTypeSizeInBits(ElemC->getType()).isZero());
409 C = ElemC;
410 } else {
411 // For non-byte-sized vector elements, the first element is not
412 // necessarily located at the vector base address.
413 if (auto *VT = dyn_cast<VectorType>(SrcTy))
414 if (!DL.typeSizeEqualsStoreSize(VT->getElementType()))
415 return nullptr;
416
417 C = C->getAggregateElement(0u);
418 }
419 } while (C);
420
421 return nullptr;
422}
423
424namespace {
425
426/// Recursive helper to read bits out of global. C is the constant being copied
427/// out of. ByteOffset is an offset into C. CurPtr is the pointer to copy
428/// results into and BytesLeft is the number of bytes left in
429/// the CurPtr buffer. DL is the DataLayout.
430bool ReadDataFromGlobal(Constant *C, uint64_t ByteOffset, unsigned char *CurPtr,
431 unsigned BytesLeft, const DataLayout &DL) {
432 assert(ByteOffset <= DL.getTypeAllocSize(C->getType()) &&
433 "Out of range access");
434
435 // Reading type padding, return zero.
436 if (ByteOffset >= DL.getTypeStoreSize(C->getType()))
437 return true;
438
439 // If this element is zero or undefined, we can just return since *CurPtr is
440 // zero initialized.
442 return true;
443
444 auto *CI = dyn_cast<ConstantInt>(C);
445 if (CI && CI->getType()->isIntegerTy()) {
446 if ((CI->getBitWidth() & 7) != 0)
447 return false;
448 const APInt &Val = CI->getValue();
449 unsigned IntBytes = unsigned(CI->getBitWidth()/8);
450
451 for (unsigned i = 0; i != BytesLeft && ByteOffset != IntBytes; ++i) {
452 unsigned n = ByteOffset;
453 if (!DL.isLittleEndian())
454 n = IntBytes - n - 1;
455 CurPtr[i] = Val.extractBits(8, n * 8).getZExtValue();
456 ++ByteOffset;
457 }
458 return true;
459 }
460
461 auto *CFP = dyn_cast<ConstantFP>(C);
462 if (CFP && CFP->getType()->isFloatingPointTy()) {
463 if (CFP->getType()->isDoubleTy()) {
464 C = FoldBitCast(C, Type::getInt64Ty(C->getContext()), DL);
465 return ReadDataFromGlobal(C, ByteOffset, CurPtr, BytesLeft, DL);
466 }
467 if (CFP->getType()->isFloatTy()){
468 C = FoldBitCast(C, Type::getInt32Ty(C->getContext()), DL);
469 return ReadDataFromGlobal(C, ByteOffset, CurPtr, BytesLeft, DL);
470 }
471 if (CFP->getType()->isHalfTy()){
472 C = FoldBitCast(C, Type::getInt16Ty(C->getContext()), DL);
473 return ReadDataFromGlobal(C, ByteOffset, CurPtr, BytesLeft, DL);
474 }
475 return false;
476 }
477
478 if (auto *CS = dyn_cast<ConstantStruct>(C)) {
479 const StructLayout *SL = DL.getStructLayout(CS->getType());
480 unsigned Index = SL->getElementContainingOffset(ByteOffset);
481 uint64_t CurEltOffset = SL->getElementOffset(Index);
482 ByteOffset -= CurEltOffset;
483
484 while (true) {
485 // If the element access is to the element itself and not to tail padding,
486 // read the bytes from the element.
487 uint64_t EltSize = DL.getTypeAllocSize(CS->getOperand(Index)->getType());
488
489 if (ByteOffset < EltSize &&
490 !ReadDataFromGlobal(CS->getOperand(Index), ByteOffset, CurPtr,
491 BytesLeft, DL))
492 return false;
493
494 ++Index;
495
496 // Check to see if we read from the last struct element, if so we're done.
497 if (Index == CS->getType()->getNumElements())
498 return true;
499
500 // If we read all of the bytes we needed from this element we're done.
501 uint64_t NextEltOffset = SL->getElementOffset(Index);
502
503 if (BytesLeft <= NextEltOffset - CurEltOffset - ByteOffset)
504 return true;
505
506 // Move to the next element of the struct.
507 CurPtr += NextEltOffset - CurEltOffset - ByteOffset;
508 BytesLeft -= NextEltOffset - CurEltOffset - ByteOffset;
509 ByteOffset = 0;
510 CurEltOffset = NextEltOffset;
511 }
512 // not reached.
513 }
514
518 uint64_t NumElts, EltSize;
519 Type *EltTy;
520 if (auto *AT = dyn_cast<ArrayType>(C->getType())) {
521 NumElts = AT->getNumElements();
522 EltTy = AT->getElementType();
523 EltSize = DL.getTypeAllocSize(EltTy);
524 } else {
525 NumElts = cast<FixedVectorType>(C->getType())->getNumElements();
526 EltTy = cast<FixedVectorType>(C->getType())->getElementType();
527 // TODO: For non-byte-sized vectors, current implementation assumes there is
528 // padding to the next byte boundary between elements.
529 if (!DL.typeSizeEqualsStoreSize(EltTy))
530 return false;
531
532 EltSize = DL.getTypeStoreSize(EltTy);
533 }
534 uint64_t Index = ByteOffset / EltSize;
535 uint64_t Offset = ByteOffset - Index * EltSize;
536
537 for (; Index != NumElts; ++Index) {
538 if (!ReadDataFromGlobal(C->getAggregateElement(Index), Offset, CurPtr,
539 BytesLeft, DL))
540 return false;
541
542 uint64_t BytesWritten = EltSize - Offset;
543 assert(BytesWritten <= EltSize && "Not indexing into this element?");
544 if (BytesWritten >= BytesLeft)
545 return true;
546
547 Offset = 0;
548 BytesLeft -= BytesWritten;
549 CurPtr += BytesWritten;
550 }
551 return true;
552 }
553
554 if (auto *CE = dyn_cast<ConstantExpr>(C)) {
555 if (CE->getOpcode() == Instruction::IntToPtr &&
556 CE->getOperand(0)->getType() == DL.getIntPtrType(CE->getType())) {
557 return ReadDataFromGlobal(CE->getOperand(0), ByteOffset, CurPtr,
558 BytesLeft, DL);
559 }
560 }
561
562 // Otherwise, unknown initializer type.
563 return false;
564}
565
566Constant *FoldReinterpretLoadFromConst(Constant *C, Type *LoadTy,
567 int64_t Offset, const DataLayout &DL) {
568 // Bail out early. Not expect to load from scalable global variable.
569 if (isa<ScalableVectorType>(LoadTy))
570 return nullptr;
571
572 auto *IntType = dyn_cast<IntegerType>(LoadTy);
573
574 // If this isn't an integer load we can't fold it directly.
575 if (!IntType) {
576 // If this is a non-integer load, we can try folding it as an int load and
577 // then bitcast the result. This can be useful for union cases. Note
578 // that address spaces don't matter here since we're not going to result in
579 // an actual new load.
580 if (!LoadTy->isFloatingPointTy() && !LoadTy->isPointerTy() &&
581 !LoadTy->isVectorTy())
582 return nullptr;
583
584 Type *MapTy = Type::getIntNTy(C->getContext(),
585 DL.getTypeSizeInBits(LoadTy).getFixedValue());
586 if (Constant *Res = FoldReinterpretLoadFromConst(C, MapTy, Offset, DL)) {
587 if (Res->isNullValue() && !LoadTy->isX86_AMXTy())
588 // Materializing a zero can be done trivially without a bitcast
589 return Constant::getNullValue(LoadTy);
590 Type *CastTy = LoadTy->isPtrOrPtrVectorTy() ? DL.getIntPtrType(LoadTy) : LoadTy;
591 Res = FoldBitCast(Res, CastTy, DL);
592 if (LoadTy->isPtrOrPtrVectorTy()) {
593 // For vector of pointer, we needed to first convert to a vector of integer, then do vector inttoptr
594 if (Res->isNullValue() && !LoadTy->isX86_AMXTy())
595 return Constant::getNullValue(LoadTy);
596 if (DL.isNonIntegralPointerType(LoadTy->getScalarType()))
597 // Be careful not to replace a load of an addrspace value with an inttoptr here
598 return nullptr;
599 Res = ConstantExpr::getIntToPtr(Res, LoadTy);
600 }
601 return Res;
602 }
603 return nullptr;
604 }
605
606 unsigned BytesLoaded = (IntType->getBitWidth() + 7) / 8;
607 if (BytesLoaded > 32 || BytesLoaded == 0)
608 return nullptr;
609
610 // If we're not accessing anything in this constant, the result is undefined.
611 if (Offset <= -1 * static_cast<int64_t>(BytesLoaded))
612 return PoisonValue::get(IntType);
613
614 // TODO: We should be able to support scalable types.
615 TypeSize InitializerSize = DL.getTypeAllocSize(C->getType());
616 if (InitializerSize.isScalable())
617 return nullptr;
618
619 // If we're not accessing anything in this constant, the result is undefined.
620 if (Offset >= (int64_t)InitializerSize.getFixedValue())
621 return PoisonValue::get(IntType);
622
623 unsigned char RawBytes[32] = {0};
624 unsigned char *CurPtr = RawBytes;
625 unsigned BytesLeft = BytesLoaded;
626
627 // If we're loading off the beginning of the global, some bytes may be valid.
628 if (Offset < 0) {
629 CurPtr += -Offset;
630 BytesLeft += Offset;
631 Offset = 0;
632 }
633
634 if (!ReadDataFromGlobal(C, Offset, CurPtr, BytesLeft, DL))
635 return nullptr;
636
637 APInt ResultVal = APInt(IntType->getBitWidth(), 0);
638 if (DL.isLittleEndian()) {
639 ResultVal = RawBytes[BytesLoaded - 1];
640 for (unsigned i = 1; i != BytesLoaded; ++i) {
641 ResultVal <<= 8;
642 ResultVal |= RawBytes[BytesLoaded - 1 - i];
643 }
644 } else {
645 ResultVal = RawBytes[0];
646 for (unsigned i = 1; i != BytesLoaded; ++i) {
647 ResultVal <<= 8;
648 ResultVal |= RawBytes[i];
649 }
650 }
651
652 return ConstantInt::get(IntType->getContext(), ResultVal);
653}
654
655} // anonymous namespace
656
657// If GV is a constant with an initializer read its representation starting
658// at Offset and return it as a constant array of unsigned char. Otherwise
659// return null.
662 if (!GV->isConstant() || !GV->hasDefinitiveInitializer())
663 return nullptr;
664
665 const DataLayout &DL = GV->getDataLayout();
666 Constant *Init = const_cast<Constant *>(GV->getInitializer());
667 TypeSize InitSize = DL.getTypeAllocSize(Init->getType());
668 if (InitSize < Offset)
669 return nullptr;
670
671 uint64_t NBytes = InitSize - Offset;
672 if (NBytes > UINT16_MAX)
673 // Bail for large initializers in excess of 64K to avoid allocating
674 // too much memory.
675 // Offset is assumed to be less than or equal than InitSize (this
676 // is enforced in ReadDataFromGlobal).
677 return nullptr;
678
679 SmallVector<unsigned char, 256> RawBytes(static_cast<size_t>(NBytes));
680 unsigned char *CurPtr = RawBytes.data();
681
682 if (!ReadDataFromGlobal(Init, Offset, CurPtr, NBytes, DL))
683 return nullptr;
684
685 return ConstantDataArray::get(GV->getContext(), RawBytes);
686}
687
688/// If this Offset points exactly to the start of an aggregate element, return
689/// that element, otherwise return nullptr.
691 const DataLayout &DL) {
692 if (Offset.isZero())
693 return Base;
694
696 return nullptr;
697
698 Type *ElemTy = Base->getType();
699 SmallVector<APInt> Indices = DL.getGEPIndicesForOffset(ElemTy, Offset);
700 if (!Offset.isZero() || !Indices[0].isZero())
701 return nullptr;
702
703 Constant *C = Base;
704 for (const APInt &Index : drop_begin(Indices)) {
705 if (Index.isNegative() || Index.getActiveBits() >= 32)
706 return nullptr;
707
708 C = C->getAggregateElement(Index.getZExtValue());
709 if (!C)
710 return nullptr;
711 }
712
713 return C;
714}
715
717 const APInt &Offset,
718 const DataLayout &DL) {
719 if (Constant *AtOffset = getConstantAtOffset(C, Offset, DL))
720 if (Constant *Result = ConstantFoldLoadThroughBitcast(AtOffset, Ty, DL))
721 return Result;
722
723 // Explicitly check for out-of-bounds access, so we return poison even if the
724 // constant is a uniform value.
725 TypeSize Size = DL.getTypeAllocSize(C->getType());
726 if (!Size.isScalable() && Offset.sge(Size.getFixedValue()))
727 return PoisonValue::get(Ty);
728
729 // Try an offset-independent fold of a uniform value.
730 if (Constant *Result = ConstantFoldLoadFromUniformValue(C, Ty, DL))
731 return Result;
732
733 // Try hard to fold loads from bitcasted strange and non-type-safe things.
734 if (Offset.getSignificantBits() <= 64)
735 if (Constant *Result =
736 FoldReinterpretLoadFromConst(C, Ty, Offset.getSExtValue(), DL))
737 return Result;
738
739 return nullptr;
740}
741
746
749 const DataLayout &DL) {
750 // We can only fold loads from constant globals with a definitive initializer.
751 // Check this upfront, to skip expensive offset calculations.
753 if (!GV || !GV->isConstant() || !GV->hasDefinitiveInitializer())
754 return nullptr;
755
756 C = cast<Constant>(C->stripAndAccumulateConstantOffsets(
757 DL, Offset, /* AllowNonInbounds */ true));
758
759 if (C == GV)
760 if (Constant *Result = ConstantFoldLoadFromConst(GV->getInitializer(), Ty,
761 Offset, DL))
762 return Result;
763
764 // If this load comes from anywhere in a uniform constant global, the value
765 // is always the same, regardless of the loaded offset.
766 return ConstantFoldLoadFromUniformValue(GV->getInitializer(), Ty, DL);
767}
768
770 const DataLayout &DL) {
771 APInt Offset(DL.getIndexTypeSizeInBits(C->getType()), 0);
772 return ConstantFoldLoadFromConstPtr(C, Ty, std::move(Offset), DL);
773}
774
776 const DataLayout &DL) {
777 if (isa<PoisonValue>(C))
778 return PoisonValue::get(Ty);
779 if (isa<UndefValue>(C))
780 return UndefValue::get(Ty);
781 // If padding is needed when storing C to memory, then it isn't considered as
782 // uniform.
783 if (!DL.typeSizeEqualsStoreSize(C->getType()))
784 return nullptr;
785 if (C->isNullValue() && !Ty->isX86_AMXTy())
786 return Constant::getNullValue(Ty);
787 if (C->isAllOnesValue() &&
788 (Ty->isIntOrIntVectorTy() || Ty->isFPOrFPVectorTy()))
789 return Constant::getAllOnesValue(Ty);
790 return nullptr;
791}
792
793namespace {
794
795/// One of Op0/Op1 is a constant expression.
796/// Attempt to symbolically evaluate the result of a binary operator merging
797/// these together. If target data info is available, it is provided as DL,
798/// otherwise DL is null.
799Constant *SymbolicallyEvaluateBinop(unsigned Opc, Constant *Op0, Constant *Op1,
800 const DataLayout &DL) {
801 // SROA
802
803 // Fold (and 0xffffffff00000000, (shl x, 32)) -> shl.
804 // Fold (lshr (or X, Y), 32) -> (lshr [X/Y], 32) if one doesn't contribute
805 // bits.
806
807 if (Opc == Instruction::And) {
808 KnownBits Known0 = computeKnownBits(Op0, DL);
809 KnownBits Known1 = computeKnownBits(Op1, DL);
810 if ((Known1.One | Known0.Zero).isAllOnes()) {
811 // All the bits of Op0 that the 'and' could be masking are already zero.
812 return Op0;
813 }
814 if ((Known0.One | Known1.Zero).isAllOnes()) {
815 // All the bits of Op1 that the 'and' could be masking are already zero.
816 return Op1;
817 }
818
819 Known0 &= Known1;
820 if (Known0.isConstant())
821 return ConstantInt::get(Op0->getType(), Known0.getConstant());
822 }
823
824 // If the constant expr is something like &A[123] - &A[4].f, fold this into a
825 // constant. This happens frequently when iterating over a global array.
826 if (Opc == Instruction::Sub) {
827 GlobalValue *GV1, *GV2;
828 APInt Offs1, Offs2;
829
830 if (IsConstantOffsetFromGlobal(Op0, GV1, Offs1, DL))
831 if (IsConstantOffsetFromGlobal(Op1, GV2, Offs2, DL) && GV1 == GV2) {
832 unsigned OpSize = DL.getTypeSizeInBits(Op0->getType());
833
834 // (&GV+C1) - (&GV+C2) -> C1-C2, pointer arithmetic cannot overflow.
835 // PtrToInt may change the bitwidth so we have convert to the right size
836 // first.
837 return ConstantInt::get(Op0->getType(), Offs1.zextOrTrunc(OpSize) -
838 Offs2.zextOrTrunc(OpSize));
839 }
840 }
841
842 return nullptr;
843}
844
845/// If array indices are not pointer-sized integers, explicitly cast them so
846/// that they aren't implicitly casted by the getelementptr.
847Constant *CastGEPIndices(Type *SrcElemTy, ArrayRef<Constant *> Ops,
848 Type *ResultTy, GEPNoWrapFlags NW,
849 std::optional<ConstantRange> InRange,
850 const DataLayout &DL, const TargetLibraryInfo *TLI) {
851 Type *IntIdxTy = DL.getIndexType(ResultTy);
852 Type *IntIdxScalarTy = IntIdxTy->getScalarType();
853
854 bool Any = false;
856 for (unsigned i = 1, e = Ops.size(); i != e; ++i) {
857 if ((i == 1 ||
859 SrcElemTy, Ops.slice(1, i - 1)))) &&
860 Ops[i]->getType()->getScalarType() != IntIdxScalarTy) {
861 Any = true;
862 Type *NewType =
863 Ops[i]->getType()->isVectorTy() ? IntIdxTy : IntIdxScalarTy;
865 CastInst::getCastOpcode(Ops[i], true, NewType, true), Ops[i], NewType,
866 DL);
867 if (!NewIdx)
868 return nullptr;
869 NewIdxs.push_back(NewIdx);
870 } else
871 NewIdxs.push_back(Ops[i]);
872 }
873
874 if (!Any)
875 return nullptr;
876
877 Constant *C =
878 ConstantExpr::getGetElementPtr(SrcElemTy, Ops[0], NewIdxs, NW, InRange);
879 return ConstantFoldConstant(C, DL, TLI);
880}
881
882/// If we can symbolically evaluate the GEP constant expression, do so.
883Constant *SymbolicallyEvaluateGEP(const GEPOperator *GEP,
885 const DataLayout &DL,
886 const TargetLibraryInfo *TLI) {
887 Type *SrcElemTy = GEP->getSourceElementType();
888 Type *ResTy = GEP->getType();
889 if (!SrcElemTy->isSized() || isa<ScalableVectorType>(SrcElemTy))
890 return nullptr;
891
892 if (Constant *C = CastGEPIndices(SrcElemTy, Ops, ResTy, GEP->getNoWrapFlags(),
893 GEP->getInRange(), DL, TLI))
894 return C;
895
896 Constant *Ptr = Ops[0];
897 if (!Ptr->getType()->isPointerTy())
898 return nullptr;
899
900 Type *IntIdxTy = DL.getIndexType(Ptr->getType());
901
902 for (unsigned i = 1, e = Ops.size(); i != e; ++i)
903 if (!isa<ConstantInt>(Ops[i]) || !Ops[i]->getType()->isIntegerTy())
904 return nullptr;
905
906 unsigned BitWidth = DL.getTypeSizeInBits(IntIdxTy);
908 BitWidth,
909 DL.getIndexedOffsetInType(
910 SrcElemTy, ArrayRef((Value *const *)Ops.data() + 1, Ops.size() - 1)),
911 /*isSigned=*/true, /*implicitTrunc=*/true);
912
913 std::optional<ConstantRange> InRange = GEP->getInRange();
914 if (InRange)
915 InRange = InRange->sextOrTrunc(BitWidth);
916
917 // If this is a GEP of a GEP, fold it all into a single GEP.
918 GEPNoWrapFlags NW = GEP->getNoWrapFlags();
919 bool Overflow = false;
920 while (auto *GEP = dyn_cast<GEPOperator>(Ptr)) {
921 NW &= GEP->getNoWrapFlags();
922
923 SmallVector<Value *, 4> NestedOps(llvm::drop_begin(GEP->operands()));
924
925 // Do not try the incorporate the sub-GEP if some index is not a number.
926 bool AllConstantInt = true;
927 for (Value *NestedOp : NestedOps)
928 if (!isa<ConstantInt>(NestedOp)) {
929 AllConstantInt = false;
930 break;
931 }
932 if (!AllConstantInt)
933 break;
934
935 // Adjust inrange offset and intersect inrange attributes
936 if (auto GEPRange = GEP->getInRange()) {
937 auto AdjustedGEPRange = GEPRange->sextOrTrunc(BitWidth).subtract(Offset);
938 InRange =
939 InRange ? InRange->intersectWith(AdjustedGEPRange) : AdjustedGEPRange;
940 }
941
942 Ptr = cast<Constant>(GEP->getOperand(0));
943 SrcElemTy = GEP->getSourceElementType();
944 Offset = Offset.sadd_ov(
945 APInt(BitWidth, DL.getIndexedOffsetInType(SrcElemTy, NestedOps),
946 /*isSigned=*/true, /*implicitTrunc=*/true),
947 Overflow);
948 }
949
950 // Preserving nusw (without inbounds) also requires that the offset
951 // additions did not overflow.
952 if (NW.hasNoUnsignedSignedWrap() && !NW.isInBounds() && Overflow)
954
955 // If the base value for this address is a literal integer value, fold the
956 // getelementptr to the resulting integer value casted to the pointer type.
957 APInt BaseIntVal(DL.getPointerTypeSizeInBits(Ptr->getType()), 0);
958 if (auto *CE = dyn_cast<ConstantExpr>(Ptr)) {
959 if (CE->getOpcode() == Instruction::IntToPtr) {
960 if (auto *Base = dyn_cast<ConstantInt>(CE->getOperand(0)))
961 BaseIntVal = Base->getValue().zextOrTrunc(BaseIntVal.getBitWidth());
962 }
963 }
964
965 if ((Ptr->isNullValue() || BaseIntVal != 0) &&
966 !DL.mustNotIntroduceIntToPtr(Ptr->getType())) {
967
968 // If the index size is smaller than the pointer size, add to the low
969 // bits only.
970 BaseIntVal.insertBits(BaseIntVal.trunc(BitWidth) + Offset, 0);
971 Constant *C = ConstantInt::get(Ptr->getContext(), BaseIntVal);
972 return ConstantExpr::getIntToPtr(C, ResTy);
973 }
974
975 // Try to infer inbounds for GEPs of globals.
976 if (!NW.isInBounds() && Offset.isNonNegative()) {
977 bool CanBeNull, CanBeFreed;
978 uint64_t DerefBytes =
979 Ptr->getPointerDereferenceableBytes(DL, CanBeNull, CanBeFreed);
980 if (DerefBytes != 0 && !CanBeNull && Offset.sle(DerefBytes))
982 }
983
984 // nusw + nneg -> nuw
985 if (NW.hasNoUnsignedSignedWrap() && Offset.isNonNegative())
987
988 // Otherwise canonicalize this to a single ptradd.
989 LLVMContext &Ctx = Ptr->getContext();
990 return ConstantExpr::getPtrAdd(Ptr, ConstantInt::get(Ctx, Offset), NW,
991 InRange);
992}
993
994/// Attempt to constant fold an instruction with the
995/// specified opcode and operands. If successful, the constant result is
996/// returned, if not, null is returned. Note that this function can fail when
997/// attempting to fold instructions like loads and stores, which have no
998/// constant expression form.
999Constant *ConstantFoldInstOperandsImpl(const Value *InstOrCE, unsigned Opcode,
1001 const DataLayout &DL,
1002 const TargetLibraryInfo *TLI,
1003 bool AllowNonDeterministic) {
1004 Type *DestTy = InstOrCE->getType();
1005
1006 if (Instruction::isUnaryOp(Opcode))
1007 return ConstantFoldUnaryOpOperand(Opcode, Ops[0], DL);
1008
1009 if (Instruction::isBinaryOp(Opcode)) {
1010 switch (Opcode) {
1011 default:
1012 break;
1013 case Instruction::FAdd:
1014 case Instruction::FSub:
1015 case Instruction::FMul:
1016 case Instruction::FDiv:
1017 case Instruction::FRem:
1018 // Handle floating point instructions separately to account for denormals
1019 // TODO: If a constant expression is being folded rather than an
1020 // instruction, denormals will not be flushed/treated as zero
1021 if (const auto *I = dyn_cast<Instruction>(InstOrCE)) {
1022 return ConstantFoldFPInstOperands(Opcode, Ops[0], Ops[1], DL, I,
1023 AllowNonDeterministic);
1024 }
1025 }
1026 return ConstantFoldBinaryOpOperands(Opcode, Ops[0], Ops[1], DL);
1027 }
1028
1029 if (Instruction::isCast(Opcode))
1030 return ConstantFoldCastOperand(Opcode, Ops[0], DestTy, DL);
1031
1032 if (auto *GEP = dyn_cast<GEPOperator>(InstOrCE)) {
1033 Type *SrcElemTy = GEP->getSourceElementType();
1035 return nullptr;
1036
1037 if (Constant *C = SymbolicallyEvaluateGEP(GEP, Ops, DL, TLI))
1038 return C;
1039
1040 return ConstantExpr::getGetElementPtr(SrcElemTy, Ops[0], Ops.slice(1),
1041 GEP->getNoWrapFlags(),
1042 GEP->getInRange());
1043 }
1044
1045 if (auto *CE = dyn_cast<ConstantExpr>(InstOrCE))
1046 return CE->getWithOperands(Ops);
1047
1048 switch (Opcode) {
1049 default: return nullptr;
1050 case Instruction::ICmp:
1051 case Instruction::FCmp: {
1052 auto *C = cast<CmpInst>(InstOrCE);
1053 return ConstantFoldCompareInstOperands(C->getPredicate(), Ops[0], Ops[1],
1054 DL, TLI, C);
1055 }
1056 case Instruction::Freeze:
1057 return isGuaranteedNotToBeUndefOrPoison(Ops[0]) ? Ops[0] : nullptr;
1058 case Instruction::Call:
1059 if (auto *F = dyn_cast<Function>(Ops.back())) {
1060 const auto *Call = cast<CallBase>(InstOrCE);
1062 return ConstantFoldCall(Call, F, Ops.slice(0, Ops.size() - 1), TLI,
1063 AllowNonDeterministic);
1064 }
1065 return nullptr;
1066 case Instruction::Select:
1067 return ConstantFoldSelectInstruction(Ops[0], Ops[1], Ops[2]);
1068 case Instruction::ExtractElement:
1070 case Instruction::ExtractValue:
1072 Ops[0], cast<ExtractValueInst>(InstOrCE)->getIndices());
1073 case Instruction::InsertElement:
1074 return ConstantExpr::getInsertElement(Ops[0], Ops[1], Ops[2]);
1075 case Instruction::InsertValue:
1077 Ops[0], Ops[1], cast<InsertValueInst>(InstOrCE)->getIndices());
1078 case Instruction::ShuffleVector:
1080 Ops[0], Ops[1], cast<ShuffleVectorInst>(InstOrCE)->getShuffleMask());
1081 case Instruction::Load: {
1082 const auto *LI = dyn_cast<LoadInst>(InstOrCE);
1083 if (LI->isVolatile())
1084 return nullptr;
1085 return ConstantFoldLoadFromConstPtr(Ops[0], LI->getType(), DL);
1086 }
1087 }
1088}
1089
1090} // end anonymous namespace
1091
1092//===----------------------------------------------------------------------===//
1093// Constant Folding public APIs
1094//===----------------------------------------------------------------------===//
1095
1096namespace {
1097
1098Constant *
1099ConstantFoldConstantImpl(const Constant *C, const DataLayout &DL,
1100 const TargetLibraryInfo *TLI,
1103 return const_cast<Constant *>(C);
1104
1106 for (const Use &OldU : C->operands()) {
1107 Constant *OldC = cast<Constant>(&OldU);
1108 Constant *NewC = OldC;
1109 // Recursively fold the ConstantExpr's operands. If we have already folded
1110 // a ConstantExpr, we don't have to process it again.
1111 if (isa<ConstantVector>(OldC) || isa<ConstantExpr>(OldC)) {
1112 auto It = FoldedOps.find(OldC);
1113 if (It == FoldedOps.end()) {
1114 NewC = ConstantFoldConstantImpl(OldC, DL, TLI, FoldedOps);
1115 FoldedOps.insert({OldC, NewC});
1116 } else {
1117 NewC = It->second;
1118 }
1119 }
1120 Ops.push_back(NewC);
1121 }
1122
1123 if (auto *CE = dyn_cast<ConstantExpr>(C)) {
1124 if (Constant *Res = ConstantFoldInstOperandsImpl(
1125 CE, CE->getOpcode(), Ops, DL, TLI, /*AllowNonDeterministic=*/true))
1126 return Res;
1127 return const_cast<Constant *>(C);
1128 }
1129
1131 return ConstantVector::get(Ops);
1132}
1133
1134} // end anonymous namespace
1135
1137 const DataLayout &DL,
1138 const TargetLibraryInfo *TLI) {
1139 // Handle PHI nodes quickly here...
1140 if (auto *PN = dyn_cast<PHINode>(I)) {
1141 Constant *CommonValue = nullptr;
1142
1144 for (Value *Incoming : PN->incoming_values()) {
1145 // If the incoming value is undef then skip it. Note that while we could
1146 // skip the value if it is equal to the phi node itself we choose not to
1147 // because that would break the rule that constant folding only applies if
1148 // all operands are constants.
1150 continue;
1151 // If the incoming value is not a constant, then give up.
1152 auto *C = dyn_cast<Constant>(Incoming);
1153 if (!C)
1154 return nullptr;
1155 // Fold the PHI's operands.
1156 C = ConstantFoldConstantImpl(C, DL, TLI, FoldedOps);
1157 // If the incoming value is a different constant to
1158 // the one we saw previously, then give up.
1159 if (CommonValue && C != CommonValue)
1160 return nullptr;
1161 CommonValue = C;
1162 }
1163
1164 // If we reach here, all incoming values are the same constant or undef.
1165 return CommonValue ? CommonValue : UndefValue::get(PN->getType());
1166 }
1167
1168 // Scan the operand list, checking to see if they are all constants, if so,
1169 // hand off to ConstantFoldInstOperandsImpl.
1170 if (!all_of(I->operands(), [](const Use &U) { return isa<Constant>(U); }))
1171 return nullptr;
1172
1175 for (const Use &OpU : I->operands()) {
1176 auto *Op = cast<Constant>(&OpU);
1177 // Fold the Instruction's operands.
1178 Op = ConstantFoldConstantImpl(Op, DL, TLI, FoldedOps);
1179 Ops.push_back(Op);
1180 }
1181
1182 return ConstantFoldInstOperands(I, Ops, DL, TLI);
1183}
1184
1186 const TargetLibraryInfo *TLI) {
1188 return ConstantFoldConstantImpl(C, DL, TLI, FoldedOps);
1189}
1190
1193 const DataLayout &DL,
1194 const TargetLibraryInfo *TLI,
1195 bool AllowNonDeterministic) {
1196 return ConstantFoldInstOperandsImpl(I, I->getOpcode(), Ops, DL, TLI,
1197 AllowNonDeterministic);
1198}
1199
1201 unsigned IntPredicate, Constant *Ops0, Constant *Ops1, const DataLayout &DL,
1202 const TargetLibraryInfo *TLI, const Instruction *I) {
1203 CmpInst::Predicate Predicate = (CmpInst::Predicate)IntPredicate;
1204 // fold: icmp (inttoptr x), null -> icmp x, 0
1205 // fold: icmp null, (inttoptr x) -> icmp 0, x
1206 // fold: icmp (ptrtoint x), 0 -> icmp x, null
1207 // fold: icmp 0, (ptrtoint x) -> icmp null, x
1208 // fold: icmp (inttoptr x), (inttoptr y) -> icmp trunc/zext x, trunc/zext y
1209 // fold: icmp (ptrtoint x), (ptrtoint y) -> icmp x, y
1210 //
1211 // FIXME: The following comment is out of data and the DataLayout is here now.
1212 // ConstantExpr::getCompare cannot do this, because it doesn't have DL
1213 // around to know if bit truncation is happening.
1214 if (auto *CE0 = dyn_cast<ConstantExpr>(Ops0)) {
1215 if (Ops1->isNullValue()) {
1216 if (CE0->getOpcode() == Instruction::IntToPtr) {
1217 Type *IntPtrTy = DL.getIntPtrType(CE0->getType());
1218 // Convert the integer value to the right size to ensure we get the
1219 // proper extension or truncation.
1220 if (Constant *C = ConstantFoldIntegerCast(CE0->getOperand(0), IntPtrTy,
1221 /*IsSigned*/ false, DL)) {
1222 Constant *Null = Constant::getNullValue(C->getType());
1223 return ConstantFoldCompareInstOperands(Predicate, C, Null, DL, TLI);
1224 }
1225 }
1226
1227 // icmp only compares the address part of the pointer, so only do this
1228 // transform if the integer size matches the address size.
1229 if (CE0->getOpcode() == Instruction::PtrToInt ||
1230 CE0->getOpcode() == Instruction::PtrToAddr) {
1231 Type *AddrTy = DL.getAddressType(CE0->getOperand(0)->getType());
1232 if (CE0->getType() == AddrTy) {
1233 Constant *C = CE0->getOperand(0);
1234 Constant *Null = Constant::getNullValue(C->getType());
1235 return ConstantFoldCompareInstOperands(Predicate, C, Null, DL, TLI);
1236 }
1237 }
1238 }
1239
1240 if (auto *CE1 = dyn_cast<ConstantExpr>(Ops1)) {
1241 if (CE0->getOpcode() == CE1->getOpcode()) {
1242 if (CE0->getOpcode() == Instruction::IntToPtr) {
1243 Type *IntPtrTy = DL.getIntPtrType(CE0->getType());
1244
1245 // Convert the integer value to the right size to ensure we get the
1246 // proper extension or truncation.
1247 Constant *C0 = ConstantFoldIntegerCast(CE0->getOperand(0), IntPtrTy,
1248 /*IsSigned*/ false, DL);
1249 Constant *C1 = ConstantFoldIntegerCast(CE1->getOperand(0), IntPtrTy,
1250 /*IsSigned*/ false, DL);
1251 if (C0 && C1)
1252 return ConstantFoldCompareInstOperands(Predicate, C0, C1, DL, TLI);
1253 }
1254
1255 // icmp only compares the address part of the pointer, so only do this
1256 // transform if the integer size matches the address size.
1257 if (CE0->getOpcode() == Instruction::PtrToInt ||
1258 CE0->getOpcode() == Instruction::PtrToAddr) {
1259 Type *AddrTy = DL.getAddressType(CE0->getOperand(0)->getType());
1260 if (CE0->getType() == AddrTy &&
1261 CE0->getOperand(0)->getType() == CE1->getOperand(0)->getType()) {
1263 Predicate, CE0->getOperand(0), CE1->getOperand(0), DL, TLI);
1264 }
1265 }
1266 }
1267 }
1268
1269 // Convert pointer comparison (base+offset1) pred (base+offset2) into
1270 // offset1 pred offset2, for the case where the offset is inbounds. This
1271 // only works for equality and unsigned comparison, as inbounds permits
1272 // crossing the sign boundary. However, the offset comparison itself is
1273 // signed.
1274 if (Ops0->getType()->isPointerTy() && !ICmpInst::isSigned(Predicate)) {
1275 unsigned IndexWidth = DL.getIndexTypeSizeInBits(Ops0->getType());
1276 APInt Offset0(IndexWidth, 0);
1277 bool IsEqPred = ICmpInst::isEquality(Predicate);
1278 Value *Stripped0 = Ops0->stripAndAccumulateConstantOffsets(
1279 DL, Offset0, /*AllowNonInbounds=*/IsEqPred,
1280 /*AllowInvariantGroup=*/false, /*ExternalAnalysis=*/nullptr,
1281 /*LookThroughIntToPtr=*/IsEqPred);
1282 APInt Offset1(IndexWidth, 0);
1283 Value *Stripped1 = Ops1->stripAndAccumulateConstantOffsets(
1284 DL, Offset1, /*AllowNonInbounds=*/IsEqPred,
1285 /*AllowInvariantGroup=*/false, /*ExternalAnalysis=*/nullptr,
1286 /*LookThroughIntToPtr=*/IsEqPred);
1287 if (Stripped0 == Stripped1)
1288 return ConstantInt::getBool(
1289 Ops0->getContext(),
1290 ICmpInst::compare(Offset0, Offset1,
1291 ICmpInst::getSignedPredicate(Predicate)));
1292 }
1293 } else if (isa<ConstantExpr>(Ops1)) {
1294 // If RHS is a constant expression, but the left side isn't, swap the
1295 // operands and try again.
1296 Predicate = ICmpInst::getSwappedPredicate(Predicate);
1297 return ConstantFoldCompareInstOperands(Predicate, Ops1, Ops0, DL, TLI);
1298 }
1299
1300 if (CmpInst::isFPPredicate(Predicate)) {
1301 // Flush any denormal constant float input according to denormal handling
1302 // mode.
1303 Ops0 = FlushFPConstant(Ops0, I, /*IsOutput=*/false);
1304 if (!Ops0)
1305 return nullptr;
1306 Ops1 = FlushFPConstant(Ops1, I, /*IsOutput=*/false);
1307 if (!Ops1)
1308 return nullptr;
1309 }
1310
1311 return ConstantFoldCompareInstruction(Predicate, Ops0, Ops1);
1312}
1313
1315 const DataLayout &DL) {
1317
1318 return ConstantFoldUnaryInstruction(Opcode, Op);
1319}
1320
1322 Constant *RHS,
1323 const DataLayout &DL) {
1325 if (isa<ConstantExpr>(LHS) || isa<ConstantExpr>(RHS))
1326 if (Constant *C = SymbolicallyEvaluateBinop(Opcode, LHS, RHS, DL))
1327 return C;
1328
1330 return ConstantExpr::get(Opcode, LHS, RHS);
1331 return ConstantFoldBinaryInstruction(Opcode, LHS, RHS);
1332}
1333
1336 switch (Mode) {
1338 return nullptr;
1339 case DenormalMode::IEEE:
1340 return ConstantFP::get(Ty->getContext(), APF);
1342 return ConstantFP::get(
1343 Ty->getContext(),
1346 return ConstantFP::get(Ty->getContext(),
1347 APFloat::getZero(APF.getSemantics(), false));
1348 default:
1349 break;
1350 }
1351
1352 llvm_unreachable("unknown denormal mode");
1353}
1354
1355/// Return the denormal mode that can be assumed when executing a floating point
1356/// operation at \p CtxI.
1358 if (!CtxI || !CtxI->getParent() || !CtxI->getFunction())
1359 return DenormalMode::getDynamic();
1360 return CtxI->getFunction()->getDenormalMode(
1361 Ty->getScalarType()->getFltSemantics());
1362}
1363
1365 const Instruction *Inst,
1366 bool IsOutput) {
1367 const APFloat &APF = CFP->getValueAPF();
1368 if (!APF.isDenormal())
1369 return CFP;
1370
1372 return flushDenormalConstant(CFP->getType(), APF,
1373 IsOutput ? Mode.Output : Mode.Input);
1374}
1375
1377 bool IsOutput) {
1378 if (ConstantFP *CFP = dyn_cast<ConstantFP>(Operand))
1379 return flushDenormalConstantFP(CFP, Inst, IsOutput);
1380
1382 return Operand;
1383
1384 Type *Ty = Operand->getType();
1385 VectorType *VecTy = dyn_cast<VectorType>(Ty);
1386 if (VecTy) {
1387 if (auto *Splat = dyn_cast_or_null<ConstantFP>(Operand->getSplatValue())) {
1388 ConstantFP *Folded = flushDenormalConstantFP(Splat, Inst, IsOutput);
1389 if (!Folded)
1390 return nullptr;
1391 return ConstantVector::getSplat(VecTy->getElementCount(), Folded);
1392 }
1393
1394 Ty = VecTy->getElementType();
1395 }
1396
1397 if (isa<ConstantExpr>(Operand))
1398 return Operand;
1399
1400 if (const auto *CV = dyn_cast<ConstantVector>(Operand)) {
1402 for (unsigned i = 0, e = CV->getNumOperands(); i != e; ++i) {
1403 Constant *Element = CV->getAggregateElement(i);
1404 if (isa<UndefValue>(Element)) {
1405 NewElts.push_back(Element);
1406 continue;
1407 }
1408
1409 ConstantFP *CFP = dyn_cast<ConstantFP>(Element);
1410 if (!CFP)
1411 return nullptr;
1412
1413 ConstantFP *Folded = flushDenormalConstantFP(CFP, Inst, IsOutput);
1414 if (!Folded)
1415 return nullptr;
1416 NewElts.push_back(Folded);
1417 }
1418
1419 return ConstantVector::get(NewElts);
1420 }
1421
1422 if (const auto *CDV = dyn_cast<ConstantDataVector>(Operand)) {
1424 for (unsigned I = 0, E = CDV->getNumElements(); I < E; ++I) {
1425 const APFloat &Elt = CDV->getElementAsAPFloat(I);
1426 if (!Elt.isDenormal()) {
1427 NewElts.push_back(ConstantFP::get(Ty, Elt));
1428 } else {
1429 DenormalMode Mode = getInstrDenormalMode(Inst, Ty);
1430 ConstantFP *Folded =
1431 flushDenormalConstant(Ty, Elt, IsOutput ? Mode.Output : Mode.Input);
1432 if (!Folded)
1433 return nullptr;
1434 NewElts.push_back(Folded);
1435 }
1436 }
1437
1438 return ConstantVector::get(NewElts);
1439 }
1440
1441 return nullptr;
1442}
1443
1445 Constant *RHS, const DataLayout &DL,
1446 const Instruction *I,
1447 bool AllowNonDeterministic) {
1448 if (Instruction::isBinaryOp(Opcode)) {
1449 // Flush denormal inputs if needed.
1450 Constant *Op0 = FlushFPConstant(LHS, I, /* IsOutput */ false);
1451 if (!Op0)
1452 return nullptr;
1453 Constant *Op1 = FlushFPConstant(RHS, I, /* IsOutput */ false);
1454 if (!Op1)
1455 return nullptr;
1456
1457 // If nsz or an algebraic FMF flag is set, the result of the FP operation
1458 // may change due to future optimization. Don't constant fold them if
1459 // non-deterministic results are not allowed.
1460 if (!AllowNonDeterministic)
1462 if (FP->hasNoSignedZeros() || FP->hasAllowReassoc() ||
1463 FP->hasAllowContract() || FP->hasAllowReciprocal())
1464 return nullptr;
1465
1466 // Calculate constant result.
1467 Constant *C = ConstantFoldBinaryOpOperands(Opcode, Op0, Op1, DL);
1468 if (!C)
1469 return nullptr;
1470
1471 // Flush denormal output if needed.
1472 C = FlushFPConstant(C, I, /* IsOutput */ true);
1473 if (!C)
1474 return nullptr;
1475
1476 // The precise NaN value is non-deterministic.
1477 if (!AllowNonDeterministic && C->isNaN())
1478 return nullptr;
1479
1480 return C;
1481 }
1482 // If instruction lacks a parent/function and the denormal mode cannot be
1483 // determined, use the default (IEEE).
1484 return ConstantFoldBinaryOpOperands(Opcode, LHS, RHS, DL);
1485}
1486
1488 Type *DestTy, const DataLayout &DL) {
1489 assert(Instruction::isCast(Opcode));
1490
1491 if (auto *CE = dyn_cast<ConstantExpr>(C))
1492 if (CE->isCast())
1493 if (unsigned NewOp = CastInst::isEliminableCastPair(
1494 Instruction::CastOps(CE->getOpcode()),
1495 Instruction::CastOps(Opcode), CE->getOperand(0)->getType(),
1496 C->getType(), DestTy, &DL))
1497 return ConstantFoldCastOperand(NewOp, CE->getOperand(0), DestTy, DL);
1498
1499 switch (Opcode) {
1500 default:
1501 llvm_unreachable("Missing case");
1502 case Instruction::PtrToAddr:
1503 case Instruction::PtrToInt:
1504 if (auto *CE = dyn_cast<ConstantExpr>(C)) {
1505 Constant *FoldedValue = nullptr;
1506 // If the input is an inttoptr, eliminate the pair. This requires knowing
1507 // the width of a pointer, so it can't be done in ConstantExpr::getCast.
1508 if (CE->getOpcode() == Instruction::IntToPtr) {
1509 // zext/trunc the inttoptr to pointer/address size.
1510 Type *MidTy = Opcode == Instruction::PtrToInt
1511 ? DL.getAddressType(CE->getType())
1512 : DL.getIntPtrType(CE->getType());
1513 FoldedValue = ConstantFoldIntegerCast(CE->getOperand(0), MidTy,
1514 /*IsSigned=*/false, DL);
1515 } else if (auto *GEP = dyn_cast<GEPOperator>(CE)) {
1516 // If we have GEP, we can perform the following folds:
1517 // (ptrtoint/ptrtoaddr (gep null, x)) -> x
1518 // (ptrtoint/ptrtoaddr (gep (gep null, x), y) -> x + y, etc.
1519 unsigned BitWidth = DL.getIndexTypeSizeInBits(GEP->getType());
1520 APInt BaseOffset(BitWidth, 0);
1521 auto *Base = cast<Constant>(GEP->stripAndAccumulateConstantOffsets(
1522 DL, BaseOffset, /*AllowNonInbounds=*/true));
1523 if (Base->isNullValue()) {
1524 FoldedValue = ConstantInt::get(CE->getContext(), BaseOffset);
1525 } else {
1526 // ptrtoint/ptrtoaddr (gep i8, Ptr, (sub 0, V))
1527 // -> sub (ptrtoint/ptrtoaddr Ptr), V
1528 if (GEP->getNumIndices() == 1 &&
1529 GEP->getSourceElementType()->isIntegerTy(8)) {
1530 auto *Ptr = cast<Constant>(GEP->getPointerOperand());
1531 auto *Sub = dyn_cast<ConstantExpr>(GEP->getOperand(1));
1532 Type *IntIdxTy = DL.getIndexType(Ptr->getType());
1533 if (Sub && Sub->getType() == IntIdxTy &&
1534 Sub->getOpcode() == Instruction::Sub &&
1535 Sub->getOperand(0)->isNullValue())
1536 FoldedValue = ConstantExpr::getSub(
1537 ConstantExpr::getCast(Opcode, Ptr, IntIdxTy),
1538 Sub->getOperand(1));
1539 }
1540 }
1541 }
1542 if (FoldedValue) {
1543 // Do a zext or trunc to get to the ptrtoint/ptrtoaddr dest size.
1544 return ConstantFoldIntegerCast(FoldedValue, DestTy, /*IsSigned=*/false,
1545 DL);
1546 }
1547 }
1548 break;
1549 case Instruction::IntToPtr:
1550 // If the input is a ptrtoint, turn the pair into a ptr to ptr bitcast if
1551 // the int size is >= the ptr size and the address spaces are the same.
1552 // This requires knowing the width of a pointer, so it can't be done in
1553 // ConstantExpr::getCast.
1554 if (auto *CE = dyn_cast<ConstantExpr>(C)) {
1555 if (CE->getOpcode() == Instruction::PtrToInt) {
1556 Constant *SrcPtr = CE->getOperand(0);
1557 unsigned SrcPtrSize = DL.getPointerTypeSizeInBits(SrcPtr->getType());
1558 unsigned MidIntSize = CE->getType()->getScalarSizeInBits();
1559
1560 if (MidIntSize >= SrcPtrSize) {
1561 unsigned SrcAS = SrcPtr->getType()->getPointerAddressSpace();
1562 if (SrcAS == DestTy->getPointerAddressSpace())
1563 return FoldBitCast(CE->getOperand(0), DestTy, DL);
1564 }
1565 }
1566 }
1567 break;
1568 case Instruction::Trunc:
1569 case Instruction::ZExt:
1570 case Instruction::SExt:
1571 case Instruction::FPTrunc:
1572 case Instruction::FPExt:
1573 case Instruction::UIToFP:
1574 case Instruction::SIToFP:
1575 case Instruction::FPToUI:
1576 case Instruction::FPToSI:
1577 case Instruction::AddrSpaceCast:
1578 break;
1579 case Instruction::BitCast:
1580 return FoldBitCast(C, DestTy, DL);
1581 }
1582
1584 return ConstantExpr::getCast(Opcode, C, DestTy);
1585 return ConstantFoldCastInstruction(Opcode, C, DestTy);
1586}
1587
1589 bool IsSigned, const DataLayout &DL) {
1590 Type *SrcTy = C->getType();
1591 if (SrcTy == DestTy)
1592 return C;
1593 if (SrcTy->getScalarSizeInBits() > DestTy->getScalarSizeInBits())
1594 return ConstantFoldCastOperand(Instruction::Trunc, C, DestTy, DL);
1595 if (IsSigned)
1596 return ConstantFoldCastOperand(Instruction::SExt, C, DestTy, DL);
1597 return ConstantFoldCastOperand(Instruction::ZExt, C, DestTy, DL);
1598}
1599
1600//===----------------------------------------------------------------------===//
1601// Constant Folding for Calls
1602//
1603
1605 if (Call->isNoBuiltin())
1606 return false;
1607 if (Call->getFunctionType() != F->getFunctionType())
1608 return false;
1609
1610 // Allow FP calls (both libcalls and intrinsics) to avoid being folded.
1611 // This can be useful for GPU targets or in cross-compilation scenarios
1612 // when the exact target FP behaviour is required, and the host compiler's
1613 // behaviour may be slightly different from the device's run-time behaviour.
1614 if (DisableFPCallFolding && (F->getReturnType()->isFloatingPointTy() ||
1615 any_of(F->args(), [](const Argument &Arg) {
1616 return Arg.getType()->isFloatingPointTy();
1617 })))
1618 return false;
1619
1620 switch (F->getIntrinsicID()) {
1621 // Operations that do not operate floating-point numbers and do not depend on
1622 // FP environment can be folded even in strictfp functions.
1623 case Intrinsic::bswap:
1624 case Intrinsic::ctpop:
1625 case Intrinsic::ctlz:
1626 case Intrinsic::cttz:
1627 case Intrinsic::fshl:
1628 case Intrinsic::fshr:
1629 case Intrinsic::launder_invariant_group:
1630 case Intrinsic::strip_invariant_group:
1631 case Intrinsic::masked_load:
1632 case Intrinsic::get_active_lane_mask:
1633 case Intrinsic::abs:
1634 case Intrinsic::smax:
1635 case Intrinsic::smin:
1636 case Intrinsic::umax:
1637 case Intrinsic::umin:
1638 case Intrinsic::scmp:
1639 case Intrinsic::ucmp:
1640 case Intrinsic::sadd_with_overflow:
1641 case Intrinsic::uadd_with_overflow:
1642 case Intrinsic::ssub_with_overflow:
1643 case Intrinsic::usub_with_overflow:
1644 case Intrinsic::smul_with_overflow:
1645 case Intrinsic::umul_with_overflow:
1646 case Intrinsic::sadd_sat:
1647 case Intrinsic::uadd_sat:
1648 case Intrinsic::ssub_sat:
1649 case Intrinsic::usub_sat:
1650 case Intrinsic::smul_fix:
1651 case Intrinsic::smul_fix_sat:
1652 case Intrinsic::bitreverse:
1653 case Intrinsic::is_constant:
1654 case Intrinsic::vector_reduce_add:
1655 case Intrinsic::vector_reduce_mul:
1656 case Intrinsic::vector_reduce_and:
1657 case Intrinsic::vector_reduce_or:
1658 case Intrinsic::vector_reduce_xor:
1659 case Intrinsic::vector_reduce_smin:
1660 case Intrinsic::vector_reduce_smax:
1661 case Intrinsic::vector_reduce_umin:
1662 case Intrinsic::vector_reduce_umax:
1663 case Intrinsic::vector_extract:
1664 case Intrinsic::vector_insert:
1665 case Intrinsic::vector_interleave2:
1666 case Intrinsic::vector_interleave3:
1667 case Intrinsic::vector_interleave4:
1668 case Intrinsic::vector_interleave5:
1669 case Intrinsic::vector_interleave6:
1670 case Intrinsic::vector_interleave7:
1671 case Intrinsic::vector_interleave8:
1672 case Intrinsic::vector_deinterleave2:
1673 case Intrinsic::vector_deinterleave3:
1674 case Intrinsic::vector_deinterleave4:
1675 case Intrinsic::vector_deinterleave5:
1676 case Intrinsic::vector_deinterleave6:
1677 case Intrinsic::vector_deinterleave7:
1678 case Intrinsic::vector_deinterleave8:
1679 // Target intrinsics
1680 case Intrinsic::amdgcn_perm:
1681 case Intrinsic::amdgcn_wave_reduce_umin:
1682 case Intrinsic::amdgcn_wave_reduce_umax:
1683 case Intrinsic::amdgcn_wave_reduce_max:
1684 case Intrinsic::amdgcn_wave_reduce_min:
1685 case Intrinsic::amdgcn_wave_reduce_add:
1686 case Intrinsic::amdgcn_wave_reduce_sub:
1687 case Intrinsic::amdgcn_wave_reduce_and:
1688 case Intrinsic::amdgcn_wave_reduce_or:
1689 case Intrinsic::amdgcn_wave_reduce_xor:
1690 case Intrinsic::amdgcn_s_wqm:
1691 case Intrinsic::amdgcn_s_quadmask:
1692 case Intrinsic::amdgcn_s_bitreplicate:
1693 case Intrinsic::arm_mve_vctp8:
1694 case Intrinsic::arm_mve_vctp16:
1695 case Intrinsic::arm_mve_vctp32:
1696 case Intrinsic::arm_mve_vctp64:
1697 case Intrinsic::aarch64_sve_convert_from_svbool:
1698 case Intrinsic::wasm_alltrue:
1699 case Intrinsic::wasm_anytrue:
1700 case Intrinsic::wasm_dot:
1701 // WebAssembly float semantics are always known
1702 case Intrinsic::wasm_trunc_signed:
1703 case Intrinsic::wasm_trunc_unsigned:
1704 return true;
1705
1706 // Floating point operations cannot be folded in strictfp functions in
1707 // general case. They can be folded if FP environment is known to compiler.
1708 case Intrinsic::minnum:
1709 case Intrinsic::maxnum:
1710 case Intrinsic::minimum:
1711 case Intrinsic::maximum:
1712 case Intrinsic::minimumnum:
1713 case Intrinsic::maximumnum:
1714 case Intrinsic::log:
1715 case Intrinsic::log2:
1716 case Intrinsic::log10:
1717 case Intrinsic::exp:
1718 case Intrinsic::exp2:
1719 case Intrinsic::exp10:
1720 case Intrinsic::sqrt:
1721 case Intrinsic::sin:
1722 case Intrinsic::cos:
1723 case Intrinsic::sincos:
1724 case Intrinsic::sinh:
1725 case Intrinsic::cosh:
1726 case Intrinsic::atan:
1727 case Intrinsic::pow:
1728 case Intrinsic::powi:
1729 case Intrinsic::ldexp:
1730 case Intrinsic::fma:
1731 case Intrinsic::fmuladd:
1732 case Intrinsic::frexp:
1733 case Intrinsic::fptoui_sat:
1734 case Intrinsic::fptosi_sat:
1735 case Intrinsic::amdgcn_cos:
1736 case Intrinsic::amdgcn_cubeid:
1737 case Intrinsic::amdgcn_cubema:
1738 case Intrinsic::amdgcn_cubesc:
1739 case Intrinsic::amdgcn_cubetc:
1740 case Intrinsic::amdgcn_fmul_legacy:
1741 case Intrinsic::amdgcn_fma_legacy:
1742 case Intrinsic::amdgcn_fract:
1743 case Intrinsic::amdgcn_sin:
1744 // The intrinsics below depend on rounding mode in MXCSR.
1745 case Intrinsic::x86_sse_cvtss2si:
1746 case Intrinsic::x86_sse_cvtss2si64:
1747 case Intrinsic::x86_sse_cvttss2si:
1748 case Intrinsic::x86_sse_cvttss2si64:
1749 case Intrinsic::x86_sse2_cvtsd2si:
1750 case Intrinsic::x86_sse2_cvtsd2si64:
1751 case Intrinsic::x86_sse2_cvttsd2si:
1752 case Intrinsic::x86_sse2_cvttsd2si64:
1753 case Intrinsic::x86_avx512_vcvtss2si32:
1754 case Intrinsic::x86_avx512_vcvtss2si64:
1755 case Intrinsic::x86_avx512_cvttss2si:
1756 case Intrinsic::x86_avx512_cvttss2si64:
1757 case Intrinsic::x86_avx512_vcvtsd2si32:
1758 case Intrinsic::x86_avx512_vcvtsd2si64:
1759 case Intrinsic::x86_avx512_cvttsd2si:
1760 case Intrinsic::x86_avx512_cvttsd2si64:
1761 case Intrinsic::x86_avx512_vcvtss2usi32:
1762 case Intrinsic::x86_avx512_vcvtss2usi64:
1763 case Intrinsic::x86_avx512_cvttss2usi:
1764 case Intrinsic::x86_avx512_cvttss2usi64:
1765 case Intrinsic::x86_avx512_vcvtsd2usi32:
1766 case Intrinsic::x86_avx512_vcvtsd2usi64:
1767 case Intrinsic::x86_avx512_cvttsd2usi:
1768 case Intrinsic::x86_avx512_cvttsd2usi64:
1769
1770 // NVVM FMax intrinsics
1771 case Intrinsic::nvvm_fmax_d:
1772 case Intrinsic::nvvm_fmax_f:
1773 case Intrinsic::nvvm_fmax_ftz_f:
1774 case Intrinsic::nvvm_fmax_ftz_nan_f:
1775 case Intrinsic::nvvm_fmax_ftz_nan_xorsign_abs_f:
1776 case Intrinsic::nvvm_fmax_ftz_xorsign_abs_f:
1777 case Intrinsic::nvvm_fmax_nan_f:
1778 case Intrinsic::nvvm_fmax_nan_xorsign_abs_f:
1779 case Intrinsic::nvvm_fmax_xorsign_abs_f:
1780
1781 // NVVM FMin intrinsics
1782 case Intrinsic::nvvm_fmin_d:
1783 case Intrinsic::nvvm_fmin_f:
1784 case Intrinsic::nvvm_fmin_ftz_f:
1785 case Intrinsic::nvvm_fmin_ftz_nan_f:
1786 case Intrinsic::nvvm_fmin_ftz_nan_xorsign_abs_f:
1787 case Intrinsic::nvvm_fmin_ftz_xorsign_abs_f:
1788 case Intrinsic::nvvm_fmin_nan_f:
1789 case Intrinsic::nvvm_fmin_nan_xorsign_abs_f:
1790 case Intrinsic::nvvm_fmin_xorsign_abs_f:
1791
1792 // NVVM float/double to int32/uint32 conversion intrinsics
1793 case Intrinsic::nvvm_f2i_rm:
1794 case Intrinsic::nvvm_f2i_rn:
1795 case Intrinsic::nvvm_f2i_rp:
1796 case Intrinsic::nvvm_f2i_rz:
1797 case Intrinsic::nvvm_f2i_rm_ftz:
1798 case Intrinsic::nvvm_f2i_rn_ftz:
1799 case Intrinsic::nvvm_f2i_rp_ftz:
1800 case Intrinsic::nvvm_f2i_rz_ftz:
1801 case Intrinsic::nvvm_f2ui_rm:
1802 case Intrinsic::nvvm_f2ui_rn:
1803 case Intrinsic::nvvm_f2ui_rp:
1804 case Intrinsic::nvvm_f2ui_rz:
1805 case Intrinsic::nvvm_f2ui_rm_ftz:
1806 case Intrinsic::nvvm_f2ui_rn_ftz:
1807 case Intrinsic::nvvm_f2ui_rp_ftz:
1808 case Intrinsic::nvvm_f2ui_rz_ftz:
1809 case Intrinsic::nvvm_d2i_rm:
1810 case Intrinsic::nvvm_d2i_rn:
1811 case Intrinsic::nvvm_d2i_rp:
1812 case Intrinsic::nvvm_d2i_rz:
1813 case Intrinsic::nvvm_d2ui_rm:
1814 case Intrinsic::nvvm_d2ui_rn:
1815 case Intrinsic::nvvm_d2ui_rp:
1816 case Intrinsic::nvvm_d2ui_rz:
1817
1818 // NVVM float/double to int64/uint64 conversion intrinsics
1819 case Intrinsic::nvvm_f2ll_rm:
1820 case Intrinsic::nvvm_f2ll_rn:
1821 case Intrinsic::nvvm_f2ll_rp:
1822 case Intrinsic::nvvm_f2ll_rz:
1823 case Intrinsic::nvvm_f2ll_rm_ftz:
1824 case Intrinsic::nvvm_f2ll_rn_ftz:
1825 case Intrinsic::nvvm_f2ll_rp_ftz:
1826 case Intrinsic::nvvm_f2ll_rz_ftz:
1827 case Intrinsic::nvvm_f2ull_rm:
1828 case Intrinsic::nvvm_f2ull_rn:
1829 case Intrinsic::nvvm_f2ull_rp:
1830 case Intrinsic::nvvm_f2ull_rz:
1831 case Intrinsic::nvvm_f2ull_rm_ftz:
1832 case Intrinsic::nvvm_f2ull_rn_ftz:
1833 case Intrinsic::nvvm_f2ull_rp_ftz:
1834 case Intrinsic::nvvm_f2ull_rz_ftz:
1835 case Intrinsic::nvvm_d2ll_rm:
1836 case Intrinsic::nvvm_d2ll_rn:
1837 case Intrinsic::nvvm_d2ll_rp:
1838 case Intrinsic::nvvm_d2ll_rz:
1839 case Intrinsic::nvvm_d2ull_rm:
1840 case Intrinsic::nvvm_d2ull_rn:
1841 case Intrinsic::nvvm_d2ull_rp:
1842 case Intrinsic::nvvm_d2ull_rz:
1843
1844 // NVVM math intrinsics:
1845 case Intrinsic::nvvm_ceil_d:
1846 case Intrinsic::nvvm_ceil_f:
1847 case Intrinsic::nvvm_ceil_ftz_f:
1848
1849 case Intrinsic::nvvm_fabs:
1850 case Intrinsic::nvvm_fabs_ftz:
1851
1852 case Intrinsic::nvvm_floor_d:
1853 case Intrinsic::nvvm_floor_f:
1854 case Intrinsic::nvvm_floor_ftz_f:
1855
1856 case Intrinsic::nvvm_rcp_rm_d:
1857 case Intrinsic::nvvm_rcp_rm_f:
1858 case Intrinsic::nvvm_rcp_rm_ftz_f:
1859 case Intrinsic::nvvm_rcp_rn_d:
1860 case Intrinsic::nvvm_rcp_rn_f:
1861 case Intrinsic::nvvm_rcp_rn_ftz_f:
1862 case Intrinsic::nvvm_rcp_rp_d:
1863 case Intrinsic::nvvm_rcp_rp_f:
1864 case Intrinsic::nvvm_rcp_rp_ftz_f:
1865 case Intrinsic::nvvm_rcp_rz_d:
1866 case Intrinsic::nvvm_rcp_rz_f:
1867 case Intrinsic::nvvm_rcp_rz_ftz_f:
1868
1869 case Intrinsic::nvvm_round_d:
1870 case Intrinsic::nvvm_round_f:
1871 case Intrinsic::nvvm_round_ftz_f:
1872
1873 case Intrinsic::nvvm_saturate_d:
1874 case Intrinsic::nvvm_saturate_f:
1875 case Intrinsic::nvvm_saturate_ftz_f:
1876
1877 case Intrinsic::nvvm_sqrt_f:
1878 case Intrinsic::nvvm_sqrt_rn_d:
1879 case Intrinsic::nvvm_sqrt_rn_f:
1880 case Intrinsic::nvvm_sqrt_rn_ftz_f:
1881 return !Call->isStrictFP();
1882
1883 // NVVM add intrinsics with explicit rounding modes
1884 case Intrinsic::nvvm_add_rm_d:
1885 case Intrinsic::nvvm_add_rn_d:
1886 case Intrinsic::nvvm_add_rp_d:
1887 case Intrinsic::nvvm_add_rz_d:
1888 case Intrinsic::nvvm_add_rm_f:
1889 case Intrinsic::nvvm_add_rn_f:
1890 case Intrinsic::nvvm_add_rp_f:
1891 case Intrinsic::nvvm_add_rz_f:
1892 case Intrinsic::nvvm_add_rm_ftz_f:
1893 case Intrinsic::nvvm_add_rn_ftz_f:
1894 case Intrinsic::nvvm_add_rp_ftz_f:
1895 case Intrinsic::nvvm_add_rz_ftz_f:
1896
1897 // NVVM div intrinsics with explicit rounding modes
1898 case Intrinsic::nvvm_div_rm_d:
1899 case Intrinsic::nvvm_div_rn_d:
1900 case Intrinsic::nvvm_div_rp_d:
1901 case Intrinsic::nvvm_div_rz_d:
1902 case Intrinsic::nvvm_div_rm_f:
1903 case Intrinsic::nvvm_div_rn_f:
1904 case Intrinsic::nvvm_div_rp_f:
1905 case Intrinsic::nvvm_div_rz_f:
1906 case Intrinsic::nvvm_div_rm_ftz_f:
1907 case Intrinsic::nvvm_div_rn_ftz_f:
1908 case Intrinsic::nvvm_div_rp_ftz_f:
1909 case Intrinsic::nvvm_div_rz_ftz_f:
1910
1911 // NVVM mul intrinsics with explicit rounding modes
1912 case Intrinsic::nvvm_mul_rm_d:
1913 case Intrinsic::nvvm_mul_rn_d:
1914 case Intrinsic::nvvm_mul_rp_d:
1915 case Intrinsic::nvvm_mul_rz_d:
1916 case Intrinsic::nvvm_mul_rm_f:
1917 case Intrinsic::nvvm_mul_rn_f:
1918 case Intrinsic::nvvm_mul_rp_f:
1919 case Intrinsic::nvvm_mul_rz_f:
1920 case Intrinsic::nvvm_mul_rm_ftz_f:
1921 case Intrinsic::nvvm_mul_rn_ftz_f:
1922 case Intrinsic::nvvm_mul_rp_ftz_f:
1923 case Intrinsic::nvvm_mul_rz_ftz_f:
1924
1925 // NVVM fma intrinsics with explicit rounding modes
1926 case Intrinsic::nvvm_fma_rm_d:
1927 case Intrinsic::nvvm_fma_rn_d:
1928 case Intrinsic::nvvm_fma_rp_d:
1929 case Intrinsic::nvvm_fma_rz_d:
1930 case Intrinsic::nvvm_fma_rm_f:
1931 case Intrinsic::nvvm_fma_rn_f:
1932 case Intrinsic::nvvm_fma_rp_f:
1933 case Intrinsic::nvvm_fma_rz_f:
1934 case Intrinsic::nvvm_fma_rm_ftz_f:
1935 case Intrinsic::nvvm_fma_rn_ftz_f:
1936 case Intrinsic::nvvm_fma_rp_ftz_f:
1937 case Intrinsic::nvvm_fma_rz_ftz_f:
1938
1939 // Sign operations are actually bitwise operations, they do not raise
1940 // exceptions even for SNANs.
1941 case Intrinsic::fabs:
1942 case Intrinsic::copysign:
1943 case Intrinsic::is_fpclass:
1944 // Non-constrained variants of rounding operations means default FP
1945 // environment, they can be folded in any case.
1946 case Intrinsic::ceil:
1947 case Intrinsic::floor:
1948 case Intrinsic::round:
1949 case Intrinsic::roundeven:
1950 case Intrinsic::trunc:
1951 case Intrinsic::nearbyint:
1952 case Intrinsic::rint:
1953 case Intrinsic::canonicalize:
1954
1955 // Constrained intrinsics can be folded if FP environment is known
1956 // to compiler.
1957 case Intrinsic::experimental_constrained_fma:
1958 case Intrinsic::experimental_constrained_fmuladd:
1959 case Intrinsic::experimental_constrained_fadd:
1960 case Intrinsic::experimental_constrained_fsub:
1961 case Intrinsic::experimental_constrained_fmul:
1962 case Intrinsic::experimental_constrained_fdiv:
1963 case Intrinsic::experimental_constrained_frem:
1964 case Intrinsic::experimental_constrained_ceil:
1965 case Intrinsic::experimental_constrained_floor:
1966 case Intrinsic::experimental_constrained_round:
1967 case Intrinsic::experimental_constrained_roundeven:
1968 case Intrinsic::experimental_constrained_trunc:
1969 case Intrinsic::experimental_constrained_nearbyint:
1970 case Intrinsic::experimental_constrained_rint:
1971 case Intrinsic::experimental_constrained_fcmp:
1972 case Intrinsic::experimental_constrained_fcmps:
1973
1974 case Intrinsic::experimental_cttz_elts:
1975 return true;
1976 default:
1977 return false;
1978 case Intrinsic::not_intrinsic: break;
1979 }
1980
1981 if (!F->hasName() || Call->isStrictFP())
1982 return false;
1983
1984 // In these cases, the check of the length is required. We don't want to
1985 // return true for a name like "cos\0blah" which strcmp would return equal to
1986 // "cos", but has length 8.
1987 StringRef Name = F->getName();
1988 switch (Name[0]) {
1989 default:
1990 return false;
1991 // clang-format off
1992 case 'a':
1993 return Name == "acos" || Name == "acosf" ||
1994 Name == "asin" || Name == "asinf" ||
1995 Name == "atan" || Name == "atanf" ||
1996 Name == "atan2" || Name == "atan2f";
1997 case 'c':
1998 return Name == "ceil" || Name == "ceilf" ||
1999 Name == "cos" || Name == "cosf" ||
2000 Name == "cosh" || Name == "coshf";
2001 case 'e':
2002 return Name == "exp" || Name == "expf" || Name == "exp2" ||
2003 Name == "exp2f" || Name == "erf" || Name == "erff";
2004 case 'f':
2005 return Name == "fabs" || Name == "fabsf" ||
2006 Name == "floor" || Name == "floorf" ||
2007 Name == "fmod" || Name == "fmodf";
2008 case 'i':
2009 return Name == "ilogb" || Name == "ilogbf";
2010 case 'l':
2011 return Name == "log" || Name == "logf" || Name == "logl" ||
2012 Name == "log2" || Name == "log2f" || Name == "log10" ||
2013 Name == "log10f" || Name == "logb" || Name == "logbf" ||
2014 Name == "log1p" || Name == "log1pf";
2015 case 'n':
2016 return Name == "nearbyint" || Name == "nearbyintf";
2017 case 'p':
2018 return Name == "pow" || Name == "powf";
2019 case 'r':
2020 return Name == "remainder" || Name == "remainderf" ||
2021 Name == "rint" || Name == "rintf" ||
2022 Name == "round" || Name == "roundf" ||
2023 Name == "roundeven" || Name == "roundevenf";
2024 case 's':
2025 return Name == "sin" || Name == "sinf" ||
2026 Name == "sinh" || Name == "sinhf" ||
2027 Name == "sqrt" || Name == "sqrtf";
2028 case 't':
2029 return Name == "tan" || Name == "tanf" ||
2030 Name == "tanh" || Name == "tanhf" ||
2031 Name == "trunc" || Name == "truncf";
2032 case '_':
2033 // Check for various function names that get used for the math functions
2034 // when the header files are preprocessed with the macro
2035 // __FINITE_MATH_ONLY__ enabled.
2036 // The '12' here is the length of the shortest name that can match.
2037 // We need to check the size before looking at Name[1] and Name[2]
2038 // so we may as well check a limit that will eliminate mismatches.
2039 if (Name.size() < 12 || Name[1] != '_')
2040 return false;
2041 switch (Name[2]) {
2042 default:
2043 return false;
2044 case 'a':
2045 return Name == "__acos_finite" || Name == "__acosf_finite" ||
2046 Name == "__asin_finite" || Name == "__asinf_finite" ||
2047 Name == "__atan2_finite" || Name == "__atan2f_finite";
2048 case 'c':
2049 return Name == "__cosh_finite" || Name == "__coshf_finite";
2050 case 'e':
2051 return Name == "__exp_finite" || Name == "__expf_finite" ||
2052 Name == "__exp2_finite" || Name == "__exp2f_finite";
2053 case 'l':
2054 return Name == "__log_finite" || Name == "__logf_finite" ||
2055 Name == "__log10_finite" || Name == "__log10f_finite";
2056 case 'p':
2057 return Name == "__pow_finite" || Name == "__powf_finite";
2058 case 's':
2059 return Name == "__sinh_finite" || Name == "__sinhf_finite";
2060 }
2061 // clang-format on
2062 }
2063}
2064
2065namespace {
2066
2067Constant *GetConstantFoldFPValue(double V, Type *Ty) {
2068 if (Ty->isHalfTy() || Ty->isFloatTy()) {
2069 APFloat APF(V);
2070 bool unused;
2071 APF.convert(Ty->getFltSemantics(), APFloat::rmNearestTiesToEven, &unused);
2072 return ConstantFP::get(Ty->getContext(), APF);
2073 }
2074 if (Ty->isDoubleTy())
2075 return ConstantFP::get(Ty->getContext(), APFloat(V));
2076 llvm_unreachable("Can only constant fold half/float/double");
2077}
2078
2079#if defined(HAS_IEE754_FLOAT128) && defined(HAS_LOGF128)
2080Constant *GetConstantFoldFPValue128(float128 V, Type *Ty) {
2081 if (Ty->isFP128Ty())
2082 return ConstantFP::get(Ty, V);
2083 llvm_unreachable("Can only constant fold fp128");
2084}
2085#endif
2086
2087/// Clear the floating-point exception state.
2088inline void llvm_fenv_clearexcept() {
2089#if HAVE_DECL_FE_ALL_EXCEPT
2090 feclearexcept(FE_ALL_EXCEPT);
2091#endif
2092 errno = 0;
2093}
2094
2095/// Test if a floating-point exception was raised.
2096inline bool llvm_fenv_testexcept() {
2097 int errno_val = errno;
2098 if (errno_val == ERANGE || errno_val == EDOM)
2099 return true;
2100#if HAVE_DECL_FE_ALL_EXCEPT && HAVE_DECL_FE_INEXACT
2101 if (fetestexcept(FE_ALL_EXCEPT & ~FE_INEXACT))
2102 return true;
2103#endif
2104 return false;
2105}
2106
2107static APFloat FTZPreserveSign(const APFloat &V) {
2108 if (V.isDenormal())
2109 return APFloat::getZero(V.getSemantics(), V.isNegative());
2110 return V;
2111}
2112
2113static APFloat FlushToPositiveZero(const APFloat &V) {
2114 if (V.isDenormal())
2115 return APFloat::getZero(V.getSemantics(), false);
2116 return V;
2117}
2118
2119static APFloat FlushWithDenormKind(const APFloat &V,
2120 DenormalMode::DenormalModeKind DenormKind) {
2123 switch (DenormKind) {
2125 return V;
2127 return FTZPreserveSign(V);
2129 return FlushToPositiveZero(V);
2130 default:
2131 llvm_unreachable("Invalid denormal mode!");
2132 }
2133}
2134
2135Constant *ConstantFoldFP(double (*NativeFP)(double), const APFloat &V, Type *Ty,
2136 DenormalMode DenormMode = DenormalMode::getIEEE()) {
2137 if (!DenormMode.isValid() ||
2138 DenormMode.Input == DenormalMode::DenormalModeKind::Dynamic ||
2139 DenormMode.Output == DenormalMode::DenormalModeKind::Dynamic)
2140 return nullptr;
2141
2142 llvm_fenv_clearexcept();
2143 auto Input = FlushWithDenormKind(V, DenormMode.Input);
2144 double Result = NativeFP(Input.convertToDouble());
2145 if (llvm_fenv_testexcept()) {
2146 llvm_fenv_clearexcept();
2147 return nullptr;
2148 }
2149
2150 Constant *Output = GetConstantFoldFPValue(Result, Ty);
2151 if (DenormMode.Output == DenormalMode::DenormalModeKind::IEEE)
2152 return Output;
2153 const auto *CFP = static_cast<ConstantFP *>(Output);
2154 const auto Res = FlushWithDenormKind(CFP->getValueAPF(), DenormMode.Output);
2155 return ConstantFP::get(Ty->getContext(), Res);
2156}
2157
2158#if defined(HAS_IEE754_FLOAT128) && defined(HAS_LOGF128)
2159Constant *ConstantFoldFP128(float128 (*NativeFP)(float128), const APFloat &V,
2160 Type *Ty) {
2161 llvm_fenv_clearexcept();
2162 float128 Result = NativeFP(V.convertToQuad());
2163 if (llvm_fenv_testexcept()) {
2164 llvm_fenv_clearexcept();
2165 return nullptr;
2166 }
2167
2168 return GetConstantFoldFPValue128(Result, Ty);
2169}
2170#endif
2171
2172Constant *ConstantFoldBinaryFP(double (*NativeFP)(double, double),
2173 const APFloat &V, const APFloat &W, Type *Ty) {
2174 llvm_fenv_clearexcept();
2175 double Result = NativeFP(V.convertToDouble(), W.convertToDouble());
2176 if (llvm_fenv_testexcept()) {
2177 llvm_fenv_clearexcept();
2178 return nullptr;
2179 }
2180
2181 return GetConstantFoldFPValue(Result, Ty);
2182}
2183
2184Constant *constantFoldVectorReduce(Intrinsic::ID IID, Constant *Op) {
2185 auto *OpVT = cast<VectorType>(Op->getType());
2186
2187 // This is the same as the underlying binops - poison propagates.
2188 if (Op->containsPoisonElement())
2189 return PoisonValue::get(OpVT->getElementType());
2190
2191 // Shortcut non-accumulating reductions.
2192 if (Constant *SplatVal = Op->getSplatValue()) {
2193 switch (IID) {
2194 case Intrinsic::vector_reduce_and:
2195 case Intrinsic::vector_reduce_or:
2196 case Intrinsic::vector_reduce_smin:
2197 case Intrinsic::vector_reduce_smax:
2198 case Intrinsic::vector_reduce_umin:
2199 case Intrinsic::vector_reduce_umax:
2200 return SplatVal;
2201 case Intrinsic::vector_reduce_add:
2202 if (SplatVal->isNullValue())
2203 return SplatVal;
2204 break;
2205 case Intrinsic::vector_reduce_mul:
2206 if (SplatVal->isNullValue() || SplatVal->isOneValue())
2207 return SplatVal;
2208 break;
2209 case Intrinsic::vector_reduce_xor:
2210 if (SplatVal->isNullValue())
2211 return SplatVal;
2212 if (OpVT->getElementCount().isKnownMultipleOf(2))
2213 return Constant::getNullValue(OpVT->getElementType());
2214 break;
2215 }
2216 }
2217
2219 if (!VT)
2220 return nullptr;
2221
2222 // TODO: Handle undef.
2223 auto *EltC = dyn_cast_or_null<ConstantInt>(Op->getAggregateElement(0U));
2224 if (!EltC)
2225 return nullptr;
2226
2227 APInt Acc = EltC->getValue();
2228 for (unsigned I = 1, E = VT->getNumElements(); I != E; I++) {
2229 if (!(EltC = dyn_cast_or_null<ConstantInt>(Op->getAggregateElement(I))))
2230 return nullptr;
2231 const APInt &X = EltC->getValue();
2232 switch (IID) {
2233 case Intrinsic::vector_reduce_add:
2234 Acc = Acc + X;
2235 break;
2236 case Intrinsic::vector_reduce_mul:
2237 Acc = Acc * X;
2238 break;
2239 case Intrinsic::vector_reduce_and:
2240 Acc = Acc & X;
2241 break;
2242 case Intrinsic::vector_reduce_or:
2243 Acc = Acc | X;
2244 break;
2245 case Intrinsic::vector_reduce_xor:
2246 Acc = Acc ^ X;
2247 break;
2248 case Intrinsic::vector_reduce_smin:
2249 Acc = APIntOps::smin(Acc, X);
2250 break;
2251 case Intrinsic::vector_reduce_smax:
2252 Acc = APIntOps::smax(Acc, X);
2253 break;
2254 case Intrinsic::vector_reduce_umin:
2255 Acc = APIntOps::umin(Acc, X);
2256 break;
2257 case Intrinsic::vector_reduce_umax:
2258 Acc = APIntOps::umax(Acc, X);
2259 break;
2260 }
2261 }
2262
2263 return ConstantInt::get(Op->getContext(), Acc);
2264}
2265
2266/// Attempt to fold an SSE floating point to integer conversion of a constant
2267/// floating point. If roundTowardZero is false, the default IEEE rounding is
2268/// used (toward nearest, ties to even). This matches the behavior of the
2269/// non-truncating SSE instructions in the default rounding mode. The desired
2270/// integer type Ty is used to select how many bits are available for the
2271/// result. Returns null if the conversion cannot be performed, otherwise
2272/// returns the Constant value resulting from the conversion.
2273Constant *ConstantFoldSSEConvertToInt(const APFloat &Val, bool roundTowardZero,
2274 Type *Ty, bool IsSigned) {
2275 // All of these conversion intrinsics form an integer of at most 64bits.
2276 unsigned ResultWidth = Ty->getIntegerBitWidth();
2277 assert(ResultWidth <= 64 &&
2278 "Can only constant fold conversions to 64 and 32 bit ints");
2279
2280 uint64_t UIntVal;
2281 bool isExact = false;
2285 Val.convertToInteger(MutableArrayRef(UIntVal), ResultWidth,
2286 IsSigned, mode, &isExact);
2287 if (status != APFloat::opOK &&
2288 (!roundTowardZero || status != APFloat::opInexact))
2289 return nullptr;
2290 return ConstantInt::get(Ty, UIntVal, IsSigned);
2291}
2292
2293double getValueAsDouble(ConstantFP *Op) {
2294 Type *Ty = Op->getType();
2295
2296 if (Ty->isBFloatTy() || Ty->isHalfTy() || Ty->isFloatTy() || Ty->isDoubleTy())
2297 return Op->getValueAPF().convertToDouble();
2298
2299 bool unused;
2300 APFloat APF = Op->getValueAPF();
2302 return APF.convertToDouble();
2303}
2304
2305static bool getConstIntOrUndef(Value *Op, const APInt *&C) {
2306 if (auto *CI = dyn_cast<ConstantInt>(Op)) {
2307 C = &CI->getValue();
2308 return true;
2309 }
2310 if (isa<UndefValue>(Op)) {
2311 C = nullptr;
2312 return true;
2313 }
2314 return false;
2315}
2316
2317/// Checks if the given intrinsic call, which evaluates to constant, is allowed
2318/// to be folded.
2319///
2320/// \param CI Constrained intrinsic call.
2321/// \param St Exception flags raised during constant evaluation.
2322static bool mayFoldConstrained(ConstrainedFPIntrinsic *CI,
2323 APFloat::opStatus St) {
2324 std::optional<RoundingMode> ORM = CI->getRoundingMode();
2325 std::optional<fp::ExceptionBehavior> EB = CI->getExceptionBehavior();
2326
2327 // If the operation does not change exception status flags, it is safe
2328 // to fold.
2329 if (St == APFloat::opStatus::opOK)
2330 return true;
2331
2332 // If evaluation raised FP exception, the result can depend on rounding
2333 // mode. If the latter is unknown, folding is not possible.
2334 if (ORM == RoundingMode::Dynamic)
2335 return false;
2336
2337 // If FP exceptions are ignored, fold the call, even if such exception is
2338 // raised.
2339 if (EB && *EB != fp::ExceptionBehavior::ebStrict)
2340 return true;
2341
2342 // Leave the calculation for runtime so that exception flags be correctly set
2343 // in hardware.
2344 return false;
2345}
2346
2347/// Returns the rounding mode that should be used for constant evaluation.
2348static RoundingMode
2349getEvaluationRoundingMode(const ConstrainedFPIntrinsic *CI) {
2350 std::optional<RoundingMode> ORM = CI->getRoundingMode();
2351 if (!ORM || *ORM == RoundingMode::Dynamic)
2352 // Even if the rounding mode is unknown, try evaluating the operation.
2353 // If it does not raise inexact exception, rounding was not applied,
2354 // so the result is exact and does not depend on rounding mode. Whether
2355 // other FP exceptions are raised, it does not depend on rounding mode.
2357 return *ORM;
2358}
2359
2360/// Try to constant fold llvm.canonicalize for the given caller and value.
2361static Constant *constantFoldCanonicalize(const Type *Ty, const CallBase *CI,
2362 const APFloat &Src) {
2363 // Zero, positive and negative, is always OK to fold.
2364 if (Src.isZero()) {
2365 // Get a fresh 0, since ppc_fp128 does have non-canonical zeros.
2366 return ConstantFP::get(
2367 CI->getContext(),
2368 APFloat::getZero(Src.getSemantics(), Src.isNegative()));
2369 }
2370
2371 if (!Ty->isIEEELikeFPTy())
2372 return nullptr;
2373
2374 // Zero is always canonical and the sign must be preserved.
2375 //
2376 // Denorms and nans may have special encodings, but it should be OK to fold a
2377 // totally average number.
2378 if (Src.isNormal() || Src.isInfinity())
2379 return ConstantFP::get(CI->getContext(), Src);
2380
2381 if (Src.isDenormal() && CI->getParent() && CI->getFunction()) {
2382 DenormalMode DenormMode =
2383 CI->getFunction()->getDenormalMode(Src.getSemantics());
2384
2385 if (DenormMode == DenormalMode::getIEEE())
2386 return ConstantFP::get(CI->getContext(), Src);
2387
2388 if (DenormMode.Input == DenormalMode::Dynamic)
2389 return nullptr;
2390
2391 // If we know if either input or output is flushed, we can fold.
2392 if ((DenormMode.Input == DenormalMode::Dynamic &&
2393 DenormMode.Output == DenormalMode::IEEE) ||
2394 (DenormMode.Input == DenormalMode::IEEE &&
2395 DenormMode.Output == DenormalMode::Dynamic))
2396 return nullptr;
2397
2398 bool IsPositive =
2399 (!Src.isNegative() || DenormMode.Input == DenormalMode::PositiveZero ||
2400 (DenormMode.Output == DenormalMode::PositiveZero &&
2401 DenormMode.Input == DenormalMode::IEEE));
2402
2403 return ConstantFP::get(CI->getContext(),
2404 APFloat::getZero(Src.getSemantics(), !IsPositive));
2405 }
2406
2407 return nullptr;
2408}
2409
2410static Constant *ConstantFoldScalarCall1(StringRef Name,
2411 Intrinsic::ID IntrinsicID,
2412 Type *Ty,
2413 ArrayRef<Constant *> Operands,
2414 const TargetLibraryInfo *TLI,
2415 const CallBase *Call) {
2416 assert(Operands.size() == 1 && "Wrong number of operands.");
2417
2418 if (IntrinsicID == Intrinsic::is_constant) {
2419 // We know we have a "Constant" argument. But we want to only
2420 // return true for manifest constants, not those that depend on
2421 // constants with unknowable values, e.g. GlobalValue or BlockAddress.
2422 if (Operands[0]->isManifestConstant())
2423 return ConstantInt::getTrue(Ty->getContext());
2424 return nullptr;
2425 }
2426
2427 if (isa<UndefValue>(Operands[0])) {
2428 // cosine(arg) is between -1 and 1. cosine(invalid arg) is NaN.
2429 // ctpop() is between 0 and bitwidth, pick 0 for undef.
2430 // fptoui.sat and fptosi.sat can always fold to zero (for a zero input).
2431 if (IntrinsicID == Intrinsic::cos ||
2432 IntrinsicID == Intrinsic::ctpop ||
2433 IntrinsicID == Intrinsic::fptoui_sat ||
2434 IntrinsicID == Intrinsic::fptosi_sat ||
2435 IntrinsicID == Intrinsic::canonicalize)
2436 return Constant::getNullValue(Ty);
2437 if (IntrinsicID == Intrinsic::bswap ||
2438 IntrinsicID == Intrinsic::bitreverse ||
2439 IntrinsicID == Intrinsic::launder_invariant_group ||
2440 IntrinsicID == Intrinsic::strip_invariant_group)
2441 return Operands[0];
2442 }
2443
2444 if (isa<ConstantPointerNull>(Operands[0])) {
2445 // launder(null) == null == strip(null) iff in addrspace 0
2446 if (IntrinsicID == Intrinsic::launder_invariant_group ||
2447 IntrinsicID == Intrinsic::strip_invariant_group) {
2448 // If instruction is not yet put in a basic block (e.g. when cloning
2449 // a function during inlining), Call's caller may not be available.
2450 // So check Call's BB first before querying Call->getCaller.
2451 const Function *Caller =
2452 Call->getParent() ? Call->getCaller() : nullptr;
2453 if (Caller &&
2455 Caller, Operands[0]->getType()->getPointerAddressSpace())) {
2456 return Operands[0];
2457 }
2458 return nullptr;
2459 }
2460 }
2461
2462 if (auto *Op = dyn_cast<ConstantFP>(Operands[0])) {
2463 APFloat U = Op->getValueAPF();
2464
2465 if (IntrinsicID == Intrinsic::wasm_trunc_signed ||
2466 IntrinsicID == Intrinsic::wasm_trunc_unsigned) {
2467 bool Signed = IntrinsicID == Intrinsic::wasm_trunc_signed;
2468
2469 if (U.isNaN())
2470 return nullptr;
2471
2472 unsigned Width = Ty->getIntegerBitWidth();
2473 APSInt Int(Width, !Signed);
2474 bool IsExact = false;
2476 U.convertToInteger(Int, APFloat::rmTowardZero, &IsExact);
2477
2479 return ConstantInt::get(Ty, Int);
2480
2481 return nullptr;
2482 }
2483
2484 if (IntrinsicID == Intrinsic::fptoui_sat ||
2485 IntrinsicID == Intrinsic::fptosi_sat) {
2486 // convertToInteger() already has the desired saturation semantics.
2487 APSInt Int(Ty->getIntegerBitWidth(),
2488 IntrinsicID == Intrinsic::fptoui_sat);
2489 bool IsExact;
2490 U.convertToInteger(Int, APFloat::rmTowardZero, &IsExact);
2491 return ConstantInt::get(Ty, Int);
2492 }
2493
2494 if (IntrinsicID == Intrinsic::canonicalize)
2495 return constantFoldCanonicalize(Ty, Call, U);
2496
2497#if defined(HAS_IEE754_FLOAT128) && defined(HAS_LOGF128)
2498 if (Ty->isFP128Ty()) {
2499 if (IntrinsicID == Intrinsic::log) {
2500 float128 Result = logf128(Op->getValueAPF().convertToQuad());
2501 return GetConstantFoldFPValue128(Result, Ty);
2502 }
2503
2504 LibFunc Fp128Func = NotLibFunc;
2505 if (TLI && TLI->getLibFunc(Name, Fp128Func) && TLI->has(Fp128Func) &&
2506 Fp128Func == LibFunc_logl)
2507 return ConstantFoldFP128(logf128, Op->getValueAPF(), Ty);
2508 }
2509#endif
2510
2511 if (!Ty->isHalfTy() && !Ty->isFloatTy() && !Ty->isDoubleTy() &&
2512 !Ty->isIntegerTy())
2513 return nullptr;
2514
2515 // Use internal versions of these intrinsics.
2516
2517 if (IntrinsicID == Intrinsic::nearbyint || IntrinsicID == Intrinsic::rint ||
2518 IntrinsicID == Intrinsic::roundeven) {
2519 U.roundToIntegral(APFloat::rmNearestTiesToEven);
2520 return ConstantFP::get(Ty, U);
2521 }
2522
2523 if (IntrinsicID == Intrinsic::round) {
2524 U.roundToIntegral(APFloat::rmNearestTiesToAway);
2525 return ConstantFP::get(Ty, U);
2526 }
2527
2528 if (IntrinsicID == Intrinsic::roundeven) {
2529 U.roundToIntegral(APFloat::rmNearestTiesToEven);
2530 return ConstantFP::get(Ty, U);
2531 }
2532
2533 if (IntrinsicID == Intrinsic::ceil) {
2534 U.roundToIntegral(APFloat::rmTowardPositive);
2535 return ConstantFP::get(Ty, U);
2536 }
2537
2538 if (IntrinsicID == Intrinsic::floor) {
2539 U.roundToIntegral(APFloat::rmTowardNegative);
2540 return ConstantFP::get(Ty, U);
2541 }
2542
2543 if (IntrinsicID == Intrinsic::trunc) {
2544 U.roundToIntegral(APFloat::rmTowardZero);
2545 return ConstantFP::get(Ty, U);
2546 }
2547
2548 if (IntrinsicID == Intrinsic::fabs) {
2549 U.clearSign();
2550 return ConstantFP::get(Ty, U);
2551 }
2552
2553 if (IntrinsicID == Intrinsic::amdgcn_fract) {
2554 // The v_fract instruction behaves like the OpenCL spec, which defines
2555 // fract(x) as fmin(x - floor(x), 0x1.fffffep-1f): "The min() operator is
2556 // there to prevent fract(-small) from returning 1.0. It returns the
2557 // largest positive floating-point number less than 1.0."
2558 APFloat FloorU(U);
2559 FloorU.roundToIntegral(APFloat::rmTowardNegative);
2560 APFloat FractU(U - FloorU);
2561 APFloat AlmostOne(U.getSemantics(), 1);
2562 AlmostOne.next(/*nextDown*/ true);
2563 return ConstantFP::get(Ty, minimum(FractU, AlmostOne));
2564 }
2565
2566 // Rounding operations (floor, trunc, ceil, round and nearbyint) do not
2567 // raise FP exceptions, unless the argument is signaling NaN.
2568
2569 std::optional<APFloat::roundingMode> RM;
2570 switch (IntrinsicID) {
2571 default:
2572 break;
2573 case Intrinsic::experimental_constrained_nearbyint:
2574 case Intrinsic::experimental_constrained_rint: {
2576 RM = CI->getRoundingMode();
2577 if (!RM || *RM == RoundingMode::Dynamic)
2578 return nullptr;
2579 break;
2580 }
2581 case Intrinsic::experimental_constrained_round:
2583 break;
2584 case Intrinsic::experimental_constrained_ceil:
2586 break;
2587 case Intrinsic::experimental_constrained_floor:
2589 break;
2590 case Intrinsic::experimental_constrained_trunc:
2592 break;
2593 }
2594 if (RM) {
2596 if (U.isFinite()) {
2597 APFloat::opStatus St = U.roundToIntegral(*RM);
2598 if (IntrinsicID == Intrinsic::experimental_constrained_rint &&
2599 St == APFloat::opInexact) {
2600 std::optional<fp::ExceptionBehavior> EB = CI->getExceptionBehavior();
2601 if (EB == fp::ebStrict)
2602 return nullptr;
2603 }
2604 } else if (U.isSignaling()) {
2605 std::optional<fp::ExceptionBehavior> EB = CI->getExceptionBehavior();
2606 if (EB && *EB != fp::ebIgnore)
2607 return nullptr;
2608 U = APFloat::getQNaN(U.getSemantics());
2609 }
2610 return ConstantFP::get(Ty, U);
2611 }
2612
2613 // NVVM float/double to signed/unsigned int32/int64 conversions:
2614 switch (IntrinsicID) {
2615 // f2i
2616 case Intrinsic::nvvm_f2i_rm:
2617 case Intrinsic::nvvm_f2i_rn:
2618 case Intrinsic::nvvm_f2i_rp:
2619 case Intrinsic::nvvm_f2i_rz:
2620 case Intrinsic::nvvm_f2i_rm_ftz:
2621 case Intrinsic::nvvm_f2i_rn_ftz:
2622 case Intrinsic::nvvm_f2i_rp_ftz:
2623 case Intrinsic::nvvm_f2i_rz_ftz:
2624 // f2ui
2625 case Intrinsic::nvvm_f2ui_rm:
2626 case Intrinsic::nvvm_f2ui_rn:
2627 case Intrinsic::nvvm_f2ui_rp:
2628 case Intrinsic::nvvm_f2ui_rz:
2629 case Intrinsic::nvvm_f2ui_rm_ftz:
2630 case Intrinsic::nvvm_f2ui_rn_ftz:
2631 case Intrinsic::nvvm_f2ui_rp_ftz:
2632 case Intrinsic::nvvm_f2ui_rz_ftz:
2633 // d2i
2634 case Intrinsic::nvvm_d2i_rm:
2635 case Intrinsic::nvvm_d2i_rn:
2636 case Intrinsic::nvvm_d2i_rp:
2637 case Intrinsic::nvvm_d2i_rz:
2638 // d2ui
2639 case Intrinsic::nvvm_d2ui_rm:
2640 case Intrinsic::nvvm_d2ui_rn:
2641 case Intrinsic::nvvm_d2ui_rp:
2642 case Intrinsic::nvvm_d2ui_rz:
2643 // f2ll
2644 case Intrinsic::nvvm_f2ll_rm:
2645 case Intrinsic::nvvm_f2ll_rn:
2646 case Intrinsic::nvvm_f2ll_rp:
2647 case Intrinsic::nvvm_f2ll_rz:
2648 case Intrinsic::nvvm_f2ll_rm_ftz:
2649 case Intrinsic::nvvm_f2ll_rn_ftz:
2650 case Intrinsic::nvvm_f2ll_rp_ftz:
2651 case Intrinsic::nvvm_f2ll_rz_ftz:
2652 // f2ull
2653 case Intrinsic::nvvm_f2ull_rm:
2654 case Intrinsic::nvvm_f2ull_rn:
2655 case Intrinsic::nvvm_f2ull_rp:
2656 case Intrinsic::nvvm_f2ull_rz:
2657 case Intrinsic::nvvm_f2ull_rm_ftz:
2658 case Intrinsic::nvvm_f2ull_rn_ftz:
2659 case Intrinsic::nvvm_f2ull_rp_ftz:
2660 case Intrinsic::nvvm_f2ull_rz_ftz:
2661 // d2ll
2662 case Intrinsic::nvvm_d2ll_rm:
2663 case Intrinsic::nvvm_d2ll_rn:
2664 case Intrinsic::nvvm_d2ll_rp:
2665 case Intrinsic::nvvm_d2ll_rz:
2666 // d2ull
2667 case Intrinsic::nvvm_d2ull_rm:
2668 case Intrinsic::nvvm_d2ull_rn:
2669 case Intrinsic::nvvm_d2ull_rp:
2670 case Intrinsic::nvvm_d2ull_rz: {
2671 // In float-to-integer conversion, NaN inputs are converted to 0.
2672 if (U.isNaN()) {
2673 // In float-to-integer conversion, NaN inputs are converted to 0
2674 // when the source and destination bitwidths are both less than 64.
2675 if (nvvm::FPToIntegerIntrinsicNaNZero(IntrinsicID))
2676 return ConstantInt::get(Ty, 0);
2677
2678 // Otherwise, the most significant bit is set.
2679 unsigned BitWidth = Ty->getIntegerBitWidth();
2680 uint64_t Val = 1ULL << (BitWidth - 1);
2681 return ConstantInt::get(Ty, APInt(BitWidth, Val, /*IsSigned=*/false));
2682 }
2683
2684 APFloat::roundingMode RMode =
2686 bool IsFTZ = nvvm::FPToIntegerIntrinsicShouldFTZ(IntrinsicID);
2687 bool IsSigned = nvvm::FPToIntegerIntrinsicResultIsSigned(IntrinsicID);
2688
2689 APSInt ResInt(Ty->getIntegerBitWidth(), !IsSigned);
2690 auto FloatToRound = IsFTZ ? FTZPreserveSign(U) : U;
2691
2692 // Return max/min value for integers if the result is +/-inf or
2693 // is too large to fit in the result's integer bitwidth.
2694 bool IsExact = false;
2695 FloatToRound.convertToInteger(ResInt, RMode, &IsExact);
2696 return ConstantInt::get(Ty, ResInt);
2697 }
2698 }
2699
2700 /// We only fold functions with finite arguments. Folding NaN and inf is
2701 /// likely to be aborted with an exception anyway, and some host libms
2702 /// have known errors raising exceptions.
2703 if (!U.isFinite())
2704 return nullptr;
2705
2706 /// Currently APFloat versions of these functions do not exist, so we use
2707 /// the host native double versions. Float versions are not called
2708 /// directly but for all these it is true (float)(f((double)arg)) ==
2709 /// f(arg). Long double not supported yet.
2710 const APFloat &APF = Op->getValueAPF();
2711
2712 switch (IntrinsicID) {
2713 default: break;
2714 case Intrinsic::log:
2715 if (U.isZero())
2716 return ConstantFP::getInfinity(Ty, true);
2717 if (U.isNegative())
2718 return ConstantFP::getNaN(Ty);
2719 if (U.isExactlyValue(1.0))
2720 return ConstantFP::getZero(Ty);
2721 return ConstantFoldFP(log, APF, Ty);
2722 case Intrinsic::log2:
2723 if (U.isZero())
2724 return ConstantFP::getInfinity(Ty, true);
2725 if (U.isNegative())
2726 return ConstantFP::getNaN(Ty);
2727 if (U.isExactlyValue(1.0))
2728 return ConstantFP::getZero(Ty);
2729 // TODO: What about hosts that lack a C99 library?
2730 return ConstantFoldFP(log2, APF, Ty);
2731 case Intrinsic::log10:
2732 if (U.isZero())
2733 return ConstantFP::getInfinity(Ty, true);
2734 if (U.isNegative())
2735 return ConstantFP::getNaN(Ty);
2736 if (U.isExactlyValue(1.0))
2737 return ConstantFP::getZero(Ty);
2738 // TODO: What about hosts that lack a C99 library?
2739 return ConstantFoldFP(log10, APF, Ty);
2740 case Intrinsic::exp:
2741 return ConstantFoldFP(exp, APF, Ty);
2742 case Intrinsic::exp2:
2743 // Fold exp2(x) as pow(2, x), in case the host lacks a C99 library.
2744 return ConstantFoldBinaryFP(pow, APFloat(2.0), APF, Ty);
2745 case Intrinsic::exp10:
2746 // Fold exp10(x) as pow(10, x), in case the host lacks a C99 library.
2747 return ConstantFoldBinaryFP(pow, APFloat(10.0), APF, Ty);
2748 case Intrinsic::sin:
2749 return ConstantFoldFP(sin, APF, Ty);
2750 case Intrinsic::cos:
2751 return ConstantFoldFP(cos, APF, Ty);
2752 case Intrinsic::sinh:
2753 return ConstantFoldFP(sinh, APF, Ty);
2754 case Intrinsic::cosh:
2755 return ConstantFoldFP(cosh, APF, Ty);
2756 case Intrinsic::atan:
2757 // Implement optional behavior from C's Annex F for +/-0.0.
2758 if (U.isZero())
2759 return ConstantFP::get(Ty, U);
2760 return ConstantFoldFP(atan, APF, Ty);
2761 case Intrinsic::sqrt:
2762 return ConstantFoldFP(sqrt, APF, Ty);
2763
2764 // NVVM Intrinsics:
2765 case Intrinsic::nvvm_ceil_ftz_f:
2766 case Intrinsic::nvvm_ceil_f:
2767 case Intrinsic::nvvm_ceil_d:
2768 return ConstantFoldFP(
2769 ceil, APF, Ty,
2771 nvvm::UnaryMathIntrinsicShouldFTZ(IntrinsicID)));
2772
2773 case Intrinsic::nvvm_fabs_ftz:
2774 case Intrinsic::nvvm_fabs:
2775 return ConstantFoldFP(
2776 fabs, APF, Ty,
2778 nvvm::UnaryMathIntrinsicShouldFTZ(IntrinsicID)));
2779
2780 case Intrinsic::nvvm_floor_ftz_f:
2781 case Intrinsic::nvvm_floor_f:
2782 case Intrinsic::nvvm_floor_d:
2783 return ConstantFoldFP(
2784 floor, APF, Ty,
2786 nvvm::UnaryMathIntrinsicShouldFTZ(IntrinsicID)));
2787
2788 case Intrinsic::nvvm_rcp_rm_ftz_f:
2789 case Intrinsic::nvvm_rcp_rn_ftz_f:
2790 case Intrinsic::nvvm_rcp_rp_ftz_f:
2791 case Intrinsic::nvvm_rcp_rz_ftz_f:
2792 case Intrinsic::nvvm_rcp_rm_d:
2793 case Intrinsic::nvvm_rcp_rm_f:
2794 case Intrinsic::nvvm_rcp_rn_d:
2795 case Intrinsic::nvvm_rcp_rn_f:
2796 case Intrinsic::nvvm_rcp_rp_d:
2797 case Intrinsic::nvvm_rcp_rp_f:
2798 case Intrinsic::nvvm_rcp_rz_d:
2799 case Intrinsic::nvvm_rcp_rz_f: {
2800 APFloat::roundingMode RoundMode = nvvm::GetRCPRoundingMode(IntrinsicID);
2801 bool IsFTZ = nvvm::RCPShouldFTZ(IntrinsicID);
2802
2803 auto Denominator = IsFTZ ? FTZPreserveSign(APF) : APF;
2805 APFloat::opStatus Status = Res.divide(Denominator, RoundMode);
2806
2808 if (IsFTZ)
2809 Res = FTZPreserveSign(Res);
2810 return ConstantFP::get(Ty, Res);
2811 }
2812 return nullptr;
2813 }
2814
2815 case Intrinsic::nvvm_round_ftz_f:
2816 case Intrinsic::nvvm_round_f:
2817 case Intrinsic::nvvm_round_d: {
2818 // nvvm_round is lowered to PTX cvt.rni, which will round to nearest
2819 // integer, choosing even integer if source is equidistant between two
2820 // integers, so the semantics are closer to "rint" rather than "round".
2821 bool IsFTZ = nvvm::UnaryMathIntrinsicShouldFTZ(IntrinsicID);
2822 auto V = IsFTZ ? FTZPreserveSign(APF) : APF;
2824 return ConstantFP::get(Ty, V);
2825 }
2826
2827 case Intrinsic::nvvm_saturate_ftz_f:
2828 case Intrinsic::nvvm_saturate_d:
2829 case Intrinsic::nvvm_saturate_f: {
2830 bool IsFTZ = nvvm::UnaryMathIntrinsicShouldFTZ(IntrinsicID);
2831 auto V = IsFTZ ? FTZPreserveSign(APF) : APF;
2832 if (V.isNegative() || V.isZero() || V.isNaN())
2833 return ConstantFP::getZero(Ty);
2835 if (V > One)
2836 return ConstantFP::get(Ty, One);
2837 return ConstantFP::get(Ty, APF);
2838 }
2839
2840 case Intrinsic::nvvm_sqrt_rn_ftz_f:
2841 case Intrinsic::nvvm_sqrt_f:
2842 case Intrinsic::nvvm_sqrt_rn_d:
2843 case Intrinsic::nvvm_sqrt_rn_f:
2844 if (APF.isNegative())
2845 return nullptr;
2846 return ConstantFoldFP(
2847 sqrt, APF, Ty,
2849 nvvm::UnaryMathIntrinsicShouldFTZ(IntrinsicID)));
2850
2851 // AMDGCN Intrinsics:
2852 case Intrinsic::amdgcn_cos:
2853 case Intrinsic::amdgcn_sin: {
2854 double V = getValueAsDouble(Op);
2855 if (V < -256.0 || V > 256.0)
2856 // The gfx8 and gfx9 architectures handle arguments outside the range
2857 // [-256, 256] differently. This should be a rare case so bail out
2858 // rather than trying to handle the difference.
2859 return nullptr;
2860 bool IsCos = IntrinsicID == Intrinsic::amdgcn_cos;
2861 double V4 = V * 4.0;
2862 if (V4 == floor(V4)) {
2863 // Force exact results for quarter-integer inputs.
2864 const double SinVals[4] = { 0.0, 1.0, 0.0, -1.0 };
2865 V = SinVals[((int)V4 + (IsCos ? 1 : 0)) & 3];
2866 } else {
2867 if (IsCos)
2868 V = cos(V * 2.0 * numbers::pi);
2869 else
2870 V = sin(V * 2.0 * numbers::pi);
2871 }
2872 return GetConstantFoldFPValue(V, Ty);
2873 }
2874 }
2875
2876 if (!TLI)
2877 return nullptr;
2878
2879 LibFunc Func = NotLibFunc;
2880 if (!TLI->getLibFunc(Name, Func))
2881 return nullptr;
2882
2883 switch (Func) {
2884 default:
2885 break;
2886 case LibFunc_acos:
2887 case LibFunc_acosf:
2888 case LibFunc_acos_finite:
2889 case LibFunc_acosf_finite:
2890 if (TLI->has(Func))
2891 return ConstantFoldFP(acos, APF, Ty);
2892 break;
2893 case LibFunc_asin:
2894 case LibFunc_asinf:
2895 case LibFunc_asin_finite:
2896 case LibFunc_asinf_finite:
2897 if (TLI->has(Func))
2898 return ConstantFoldFP(asin, APF, Ty);
2899 break;
2900 case LibFunc_atan:
2901 case LibFunc_atanf:
2902 // Implement optional behavior from C's Annex F for +/-0.0.
2903 if (U.isZero())
2904 return ConstantFP::get(Ty, U);
2905 if (TLI->has(Func))
2906 return ConstantFoldFP(atan, APF, Ty);
2907 break;
2908 case LibFunc_ceil:
2909 case LibFunc_ceilf:
2910 if (TLI->has(Func)) {
2911 U.roundToIntegral(APFloat::rmTowardPositive);
2912 return ConstantFP::get(Ty, U);
2913 }
2914 break;
2915 case LibFunc_cos:
2916 case LibFunc_cosf:
2917 if (TLI->has(Func))
2918 return ConstantFoldFP(cos, APF, Ty);
2919 break;
2920 case LibFunc_cosh:
2921 case LibFunc_coshf:
2922 case LibFunc_cosh_finite:
2923 case LibFunc_coshf_finite:
2924 if (TLI->has(Func))
2925 return ConstantFoldFP(cosh, APF, Ty);
2926 break;
2927 case LibFunc_exp:
2928 case LibFunc_expf:
2929 case LibFunc_exp_finite:
2930 case LibFunc_expf_finite:
2931 if (TLI->has(Func))
2932 return ConstantFoldFP(exp, APF, Ty);
2933 break;
2934 case LibFunc_exp2:
2935 case LibFunc_exp2f:
2936 case LibFunc_exp2_finite:
2937 case LibFunc_exp2f_finite:
2938 if (TLI->has(Func))
2939 // Fold exp2(x) as pow(2, x), in case the host lacks a C99 library.
2940 return ConstantFoldBinaryFP(pow, APFloat(2.0), APF, Ty);
2941 break;
2942 case LibFunc_fabs:
2943 case LibFunc_fabsf:
2944 if (TLI->has(Func)) {
2945 U.clearSign();
2946 return ConstantFP::get(Ty, U);
2947 }
2948 break;
2949 case LibFunc_floor:
2950 case LibFunc_floorf:
2951 if (TLI->has(Func)) {
2952 U.roundToIntegral(APFloat::rmTowardNegative);
2953 return ConstantFP::get(Ty, U);
2954 }
2955 break;
2956 case LibFunc_log:
2957 case LibFunc_logf:
2958 case LibFunc_log_finite:
2959 case LibFunc_logf_finite:
2960 if (!APF.isNegative() && !APF.isZero() && TLI->has(Func))
2961 return ConstantFoldFP(log, APF, Ty);
2962 break;
2963 case LibFunc_log2:
2964 case LibFunc_log2f:
2965 case LibFunc_log2_finite:
2966 case LibFunc_log2f_finite:
2967 if (!APF.isNegative() && !APF.isZero() && TLI->has(Func))
2968 // TODO: What about hosts that lack a C99 library?
2969 return ConstantFoldFP(log2, APF, Ty);
2970 break;
2971 case LibFunc_log10:
2972 case LibFunc_log10f:
2973 case LibFunc_log10_finite:
2974 case LibFunc_log10f_finite:
2975 if (!APF.isNegative() && !APF.isZero() && TLI->has(Func))
2976 // TODO: What about hosts that lack a C99 library?
2977 return ConstantFoldFP(log10, APF, Ty);
2978 break;
2979 case LibFunc_ilogb:
2980 case LibFunc_ilogbf:
2981 if (!APF.isZero() && TLI->has(Func))
2982 return ConstantInt::get(Ty, ilogb(APF), true);
2983 break;
2984 case LibFunc_logb:
2985 case LibFunc_logbf:
2986 if (!APF.isZero() && TLI->has(Func))
2987 return ConstantFoldFP(logb, APF, Ty);
2988 break;
2989 case LibFunc_log1p:
2990 case LibFunc_log1pf:
2991 // Implement optional behavior from C's Annex F for +/-0.0.
2992 if (U.isZero())
2993 return ConstantFP::get(Ty, U);
2994 if (APF > APFloat::getOne(APF.getSemantics(), true) && TLI->has(Func))
2995 return ConstantFoldFP(log1p, APF, Ty);
2996 break;
2997 case LibFunc_logl:
2998 return nullptr;
2999 case LibFunc_erf:
3000 case LibFunc_erff:
3001 if (TLI->has(Func))
3002 return ConstantFoldFP(erf, APF, Ty);
3003 break;
3004 case LibFunc_nearbyint:
3005 case LibFunc_nearbyintf:
3006 case LibFunc_rint:
3007 case LibFunc_rintf:
3008 case LibFunc_roundeven:
3009 case LibFunc_roundevenf:
3010 if (TLI->has(Func)) {
3011 U.roundToIntegral(APFloat::rmNearestTiesToEven);
3012 return ConstantFP::get(Ty, U);
3013 }
3014 break;
3015 case LibFunc_round:
3016 case LibFunc_roundf:
3017 if (TLI->has(Func)) {
3018 U.roundToIntegral(APFloat::rmNearestTiesToAway);
3019 return ConstantFP::get(Ty, U);
3020 }
3021 break;
3022 case LibFunc_sin:
3023 case LibFunc_sinf:
3024 if (TLI->has(Func))
3025 return ConstantFoldFP(sin, APF, Ty);
3026 break;
3027 case LibFunc_sinh:
3028 case LibFunc_sinhf:
3029 case LibFunc_sinh_finite:
3030 case LibFunc_sinhf_finite:
3031 if (TLI->has(Func))
3032 return ConstantFoldFP(sinh, APF, Ty);
3033 break;
3034 case LibFunc_sqrt:
3035 case LibFunc_sqrtf:
3036 if (!APF.isNegative() && TLI->has(Func))
3037 return ConstantFoldFP(sqrt, APF, Ty);
3038 break;
3039 case LibFunc_tan:
3040 case LibFunc_tanf:
3041 if (TLI->has(Func))
3042 return ConstantFoldFP(tan, APF, Ty);
3043 break;
3044 case LibFunc_tanh:
3045 case LibFunc_tanhf:
3046 if (TLI->has(Func))
3047 return ConstantFoldFP(tanh, APF, Ty);
3048 break;
3049 case LibFunc_trunc:
3050 case LibFunc_truncf:
3051 if (TLI->has(Func)) {
3052 U.roundToIntegral(APFloat::rmTowardZero);
3053 return ConstantFP::get(Ty, U);
3054 }
3055 break;
3056 }
3057 return nullptr;
3058 }
3059
3060 if (auto *Op = dyn_cast<ConstantInt>(Operands[0])) {
3061 switch (IntrinsicID) {
3062 case Intrinsic::bswap:
3063 return ConstantInt::get(Ty->getContext(), Op->getValue().byteSwap());
3064 case Intrinsic::ctpop:
3065 return ConstantInt::get(Ty, Op->getValue().popcount());
3066 case Intrinsic::bitreverse:
3067 return ConstantInt::get(Ty->getContext(), Op->getValue().reverseBits());
3068 case Intrinsic::amdgcn_s_wqm: {
3069 uint64_t Val = Op->getZExtValue();
3070 Val |= (Val & 0x5555555555555555ULL) << 1 |
3071 ((Val >> 1) & 0x5555555555555555ULL);
3072 Val |= (Val & 0x3333333333333333ULL) << 2 |
3073 ((Val >> 2) & 0x3333333333333333ULL);
3074 return ConstantInt::get(Ty, Val);
3075 }
3076
3077 case Intrinsic::amdgcn_s_quadmask: {
3078 uint64_t Val = Op->getZExtValue();
3079 uint64_t QuadMask = 0;
3080 for (unsigned I = 0; I < Op->getBitWidth() / 4; ++I, Val >>= 4) {
3081 if (!(Val & 0xF))
3082 continue;
3083
3084 QuadMask |= (1ULL << I);
3085 }
3086 return ConstantInt::get(Ty, QuadMask);
3087 }
3088
3089 case Intrinsic::amdgcn_s_bitreplicate: {
3090 uint64_t Val = Op->getZExtValue();
3091 Val = (Val & 0x000000000000FFFFULL) | (Val & 0x00000000FFFF0000ULL) << 16;
3092 Val = (Val & 0x000000FF000000FFULL) | (Val & 0x0000FF000000FF00ULL) << 8;
3093 Val = (Val & 0x000F000F000F000FULL) | (Val & 0x00F000F000F000F0ULL) << 4;
3094 Val = (Val & 0x0303030303030303ULL) | (Val & 0x0C0C0C0C0C0C0C0CULL) << 2;
3095 Val = (Val & 0x1111111111111111ULL) | (Val & 0x2222222222222222ULL) << 1;
3096 Val = Val | Val << 1;
3097 return ConstantInt::get(Ty, Val);
3098 }
3099 }
3100 }
3101
3102 if (Operands[0]->getType()->isVectorTy()) {
3103 auto *Op = cast<Constant>(Operands[0]);
3104 switch (IntrinsicID) {
3105 default: break;
3106 case Intrinsic::vector_reduce_add:
3107 case Intrinsic::vector_reduce_mul:
3108 case Intrinsic::vector_reduce_and:
3109 case Intrinsic::vector_reduce_or:
3110 case Intrinsic::vector_reduce_xor:
3111 case Intrinsic::vector_reduce_smin:
3112 case Intrinsic::vector_reduce_smax:
3113 case Intrinsic::vector_reduce_umin:
3114 case Intrinsic::vector_reduce_umax:
3115 if (Constant *C = constantFoldVectorReduce(IntrinsicID, Operands[0]))
3116 return C;
3117 break;
3118 case Intrinsic::x86_sse_cvtss2si:
3119 case Intrinsic::x86_sse_cvtss2si64:
3120 case Intrinsic::x86_sse2_cvtsd2si:
3121 case Intrinsic::x86_sse2_cvtsd2si64:
3122 if (ConstantFP *FPOp =
3123 dyn_cast_or_null<ConstantFP>(Op->getAggregateElement(0U)))
3124 return ConstantFoldSSEConvertToInt(FPOp->getValueAPF(),
3125 /*roundTowardZero=*/false, Ty,
3126 /*IsSigned*/true);
3127 break;
3128 case Intrinsic::x86_sse_cvttss2si:
3129 case Intrinsic::x86_sse_cvttss2si64:
3130 case Intrinsic::x86_sse2_cvttsd2si:
3131 case Intrinsic::x86_sse2_cvttsd2si64:
3132 if (ConstantFP *FPOp =
3133 dyn_cast_or_null<ConstantFP>(Op->getAggregateElement(0U)))
3134 return ConstantFoldSSEConvertToInt(FPOp->getValueAPF(),
3135 /*roundTowardZero=*/true, Ty,
3136 /*IsSigned*/true);
3137 break;
3138
3139 case Intrinsic::wasm_anytrue:
3140 return Op->isNullValue() ? ConstantInt::get(Ty, 0)
3141 : ConstantInt::get(Ty, 1);
3142
3143 case Intrinsic::wasm_alltrue:
3144 // Check each element individually
3145 unsigned E = cast<FixedVectorType>(Op->getType())->getNumElements();
3146 for (unsigned I = 0; I != E; ++I) {
3147 Constant *Elt = Op->getAggregateElement(I);
3148 // Return false as soon as we find a non-true element.
3149 if (Elt && Elt->isNullValue())
3150 return ConstantInt::get(Ty, 0);
3151 // Bail as soon as we find an element we cannot prove to be true.
3152 if (!Elt || !isa<ConstantInt>(Elt))
3153 return nullptr;
3154 }
3155
3156 return ConstantInt::get(Ty, 1);
3157 }
3158 }
3159
3160 return nullptr;
3161}
3162
3163static Constant *evaluateCompare(const APFloat &Op1, const APFloat &Op2,
3167 FCmpInst::Predicate Cond = FCmp->getPredicate();
3168 if (FCmp->isSignaling()) {
3169 if (Op1.isNaN() || Op2.isNaN())
3171 } else {
3172 if (Op1.isSignaling() || Op2.isSignaling())
3174 }
3175 bool Result = FCmpInst::compare(Op1, Op2, Cond);
3176 if (mayFoldConstrained(const_cast<ConstrainedFPCmpIntrinsic *>(FCmp), St))
3177 return ConstantInt::get(Call->getType()->getScalarType(), Result);
3178 return nullptr;
3179}
3180
3181static Constant *ConstantFoldLibCall2(StringRef Name, Type *Ty,
3182 ArrayRef<Constant *> Operands,
3183 const TargetLibraryInfo *TLI) {
3184 if (!TLI)
3185 return nullptr;
3186
3187 LibFunc Func = NotLibFunc;
3188 if (!TLI->getLibFunc(Name, Func))
3189 return nullptr;
3190
3191 const auto *Op1 = dyn_cast<ConstantFP>(Operands[0]);
3192 if (!Op1)
3193 return nullptr;
3194
3195 const auto *Op2 = dyn_cast<ConstantFP>(Operands[1]);
3196 if (!Op2)
3197 return nullptr;
3198
3199 const APFloat &Op1V = Op1->getValueAPF();
3200 const APFloat &Op2V = Op2->getValueAPF();
3201
3202 switch (Func) {
3203 default:
3204 break;
3205 case LibFunc_pow:
3206 case LibFunc_powf:
3207 case LibFunc_pow_finite:
3208 case LibFunc_powf_finite:
3209 if (TLI->has(Func))
3210 return ConstantFoldBinaryFP(pow, Op1V, Op2V, Ty);
3211 break;
3212 case LibFunc_fmod:
3213 case LibFunc_fmodf:
3214 if (TLI->has(Func)) {
3215 APFloat V = Op1->getValueAPF();
3216 if (APFloat::opStatus::opOK == V.mod(Op2->getValueAPF()))
3217 return ConstantFP::get(Ty, V);
3218 }
3219 break;
3220 case LibFunc_remainder:
3221 case LibFunc_remainderf:
3222 if (TLI->has(Func)) {
3223 APFloat V = Op1->getValueAPF();
3224 if (APFloat::opStatus::opOK == V.remainder(Op2->getValueAPF()))
3225 return ConstantFP::get(Ty, V);
3226 }
3227 break;
3228 case LibFunc_atan2:
3229 case LibFunc_atan2f:
3230 // atan2(+/-0.0, +/-0.0) is known to raise an exception on some libm
3231 // (Solaris), so we do not assume a known result for that.
3232 if (Op1V.isZero() && Op2V.isZero())
3233 return nullptr;
3234 [[fallthrough]];
3235 case LibFunc_atan2_finite:
3236 case LibFunc_atan2f_finite:
3237 if (TLI->has(Func))
3238 return ConstantFoldBinaryFP(atan2, Op1V, Op2V, Ty);
3239 break;
3240 }
3241
3242 return nullptr;
3243}
3244
3245static Constant *ConstantFoldIntrinsicCall2(Intrinsic::ID IntrinsicID, Type *Ty,
3246 ArrayRef<Constant *> Operands,
3247 const CallBase *Call) {
3248 assert(Operands.size() == 2 && "Wrong number of operands.");
3249
3250 if (Ty->isFloatingPointTy()) {
3251 // TODO: We should have undef handling for all of the FP intrinsics that
3252 // are attempted to be folded in this function.
3253 bool IsOp0Undef = isa<UndefValue>(Operands[0]);
3254 bool IsOp1Undef = isa<UndefValue>(Operands[1]);
3255 switch (IntrinsicID) {
3256 case Intrinsic::maxnum:
3257 case Intrinsic::minnum:
3258 case Intrinsic::maximum:
3259 case Intrinsic::minimum:
3260 case Intrinsic::maximumnum:
3261 case Intrinsic::minimumnum:
3262 case Intrinsic::nvvm_fmax_d:
3263 case Intrinsic::nvvm_fmin_d:
3264 // If one argument is undef, return the other argument.
3265 if (IsOp0Undef)
3266 return Operands[1];
3267 if (IsOp1Undef)
3268 return Operands[0];
3269 break;
3270
3271 case Intrinsic::nvvm_fmax_f:
3272 case Intrinsic::nvvm_fmax_ftz_f:
3273 case Intrinsic::nvvm_fmax_ftz_nan_f:
3274 case Intrinsic::nvvm_fmax_ftz_nan_xorsign_abs_f:
3275 case Intrinsic::nvvm_fmax_ftz_xorsign_abs_f:
3276 case Intrinsic::nvvm_fmax_nan_f:
3277 case Intrinsic::nvvm_fmax_nan_xorsign_abs_f:
3278 case Intrinsic::nvvm_fmax_xorsign_abs_f:
3279
3280 case Intrinsic::nvvm_fmin_f:
3281 case Intrinsic::nvvm_fmin_ftz_f:
3282 case Intrinsic::nvvm_fmin_ftz_nan_f:
3283 case Intrinsic::nvvm_fmin_ftz_nan_xorsign_abs_f:
3284 case Intrinsic::nvvm_fmin_ftz_xorsign_abs_f:
3285 case Intrinsic::nvvm_fmin_nan_f:
3286 case Intrinsic::nvvm_fmin_nan_xorsign_abs_f:
3287 case Intrinsic::nvvm_fmin_xorsign_abs_f:
3288 // If one arg is undef, the other arg can be returned only if it is
3289 // constant, as we may need to flush it to sign-preserving zero or
3290 // canonicalize the NaN.
3291 if (!IsOp0Undef && !IsOp1Undef)
3292 break;
3293 if (auto *Op = dyn_cast<ConstantFP>(Operands[IsOp0Undef ? 1 : 0])) {
3294 if (Op->isNaN()) {
3295 APInt NVCanonicalNaN(32, 0x7fffffff);
3296 return ConstantFP::get(
3297 Ty, APFloat(Ty->getFltSemantics(), NVCanonicalNaN));
3298 }
3299 if (nvvm::FMinFMaxShouldFTZ(IntrinsicID))
3300 return ConstantFP::get(Ty, FTZPreserveSign(Op->getValueAPF()));
3301 else
3302 return Op;
3303 }
3304 break;
3305 }
3306 }
3307
3308 if (const auto *Op1 = dyn_cast<ConstantFP>(Operands[0])) {
3309 const APFloat &Op1V = Op1->getValueAPF();
3310
3311 if (const auto *Op2 = dyn_cast<ConstantFP>(Operands[1])) {
3312 if (Op2->getType() != Op1->getType())
3313 return nullptr;
3314 const APFloat &Op2V = Op2->getValueAPF();
3315
3316 if (const auto *ConstrIntr =
3318 RoundingMode RM = getEvaluationRoundingMode(ConstrIntr);
3319 APFloat Res = Op1V;
3321 switch (IntrinsicID) {
3322 default:
3323 return nullptr;
3324 case Intrinsic::experimental_constrained_fadd:
3325 St = Res.add(Op2V, RM);
3326 break;
3327 case Intrinsic::experimental_constrained_fsub:
3328 St = Res.subtract(Op2V, RM);
3329 break;
3330 case Intrinsic::experimental_constrained_fmul:
3331 St = Res.multiply(Op2V, RM);
3332 break;
3333 case Intrinsic::experimental_constrained_fdiv:
3334 St = Res.divide(Op2V, RM);
3335 break;
3336 case Intrinsic::experimental_constrained_frem:
3337 St = Res.mod(Op2V);
3338 break;
3339 case Intrinsic::experimental_constrained_fcmp:
3340 case Intrinsic::experimental_constrained_fcmps:
3341 return evaluateCompare(Op1V, Op2V, ConstrIntr);
3342 }
3343 if (mayFoldConstrained(const_cast<ConstrainedFPIntrinsic *>(ConstrIntr),
3344 St))
3345 return ConstantFP::get(Ty, Res);
3346 return nullptr;
3347 }
3348
3349 switch (IntrinsicID) {
3350 default:
3351 break;
3352 case Intrinsic::copysign:
3353 return ConstantFP::get(Ty, APFloat::copySign(Op1V, Op2V));
3354 case Intrinsic::minnum:
3355 return ConstantFP::get(Ty, minnum(Op1V, Op2V));
3356 case Intrinsic::maxnum:
3357 return ConstantFP::get(Ty, maxnum(Op1V, Op2V));
3358 case Intrinsic::minimum:
3359 return ConstantFP::get(Ty, minimum(Op1V, Op2V));
3360 case Intrinsic::maximum:
3361 return ConstantFP::get(Ty, maximum(Op1V, Op2V));
3362 case Intrinsic::minimumnum:
3363 return ConstantFP::get(Ty, minimumnum(Op1V, Op2V));
3364 case Intrinsic::maximumnum:
3365 return ConstantFP::get(Ty, maximumnum(Op1V, Op2V));
3366
3367 case Intrinsic::nvvm_fmax_d:
3368 case Intrinsic::nvvm_fmax_f:
3369 case Intrinsic::nvvm_fmax_ftz_f:
3370 case Intrinsic::nvvm_fmax_ftz_nan_f:
3371 case Intrinsic::nvvm_fmax_ftz_nan_xorsign_abs_f:
3372 case Intrinsic::nvvm_fmax_ftz_xorsign_abs_f:
3373 case Intrinsic::nvvm_fmax_nan_f:
3374 case Intrinsic::nvvm_fmax_nan_xorsign_abs_f:
3375 case Intrinsic::nvvm_fmax_xorsign_abs_f:
3376
3377 case Intrinsic::nvvm_fmin_d:
3378 case Intrinsic::nvvm_fmin_f:
3379 case Intrinsic::nvvm_fmin_ftz_f:
3380 case Intrinsic::nvvm_fmin_ftz_nan_f:
3381 case Intrinsic::nvvm_fmin_ftz_nan_xorsign_abs_f:
3382 case Intrinsic::nvvm_fmin_ftz_xorsign_abs_f:
3383 case Intrinsic::nvvm_fmin_nan_f:
3384 case Intrinsic::nvvm_fmin_nan_xorsign_abs_f:
3385 case Intrinsic::nvvm_fmin_xorsign_abs_f: {
3386
3387 bool ShouldCanonicalizeNaNs = !(IntrinsicID == Intrinsic::nvvm_fmax_d ||
3388 IntrinsicID == Intrinsic::nvvm_fmin_d);
3389 bool IsFTZ = nvvm::FMinFMaxShouldFTZ(IntrinsicID);
3390 bool IsNaNPropagating = nvvm::FMinFMaxPropagatesNaNs(IntrinsicID);
3391 bool IsXorSignAbs = nvvm::FMinFMaxIsXorSignAbs(IntrinsicID);
3392
3393 APFloat A = IsFTZ ? FTZPreserveSign(Op1V) : Op1V;
3394 APFloat B = IsFTZ ? FTZPreserveSign(Op2V) : Op2V;
3395
3396 bool XorSign = false;
3397 if (IsXorSignAbs) {
3398 XorSign = A.isNegative() ^ B.isNegative();
3399 A = abs(A);
3400 B = abs(B);
3401 }
3402
3403 bool IsFMax = false;
3404 switch (IntrinsicID) {
3405 case Intrinsic::nvvm_fmax_d:
3406 case Intrinsic::nvvm_fmax_f:
3407 case Intrinsic::nvvm_fmax_ftz_f:
3408 case Intrinsic::nvvm_fmax_ftz_nan_f:
3409 case Intrinsic::nvvm_fmax_ftz_nan_xorsign_abs_f:
3410 case Intrinsic::nvvm_fmax_ftz_xorsign_abs_f:
3411 case Intrinsic::nvvm_fmax_nan_f:
3412 case Intrinsic::nvvm_fmax_nan_xorsign_abs_f:
3413 case Intrinsic::nvvm_fmax_xorsign_abs_f:
3414 IsFMax = true;
3415 break;
3416 }
3417 APFloat Res = IsFMax ? maximum(A, B) : minimum(A, B);
3418
3419 if (ShouldCanonicalizeNaNs) {
3420 APFloat NVCanonicalNaN(Res.getSemantics(), APInt(32, 0x7fffffff));
3421 if (A.isNaN() && B.isNaN())
3422 return ConstantFP::get(Ty, NVCanonicalNaN);
3423 else if (IsNaNPropagating && (A.isNaN() || B.isNaN()))
3424 return ConstantFP::get(Ty, NVCanonicalNaN);
3425 }
3426
3427 if (A.isNaN() && B.isNaN())
3428 return Operands[1];
3429 else if (A.isNaN())
3430 Res = B;
3431 else if (B.isNaN())
3432 Res = A;
3433
3434 if (IsXorSignAbs && XorSign != Res.isNegative())
3435 Res.changeSign();
3436
3437 return ConstantFP::get(Ty, Res);
3438 }
3439
3440 case Intrinsic::nvvm_add_rm_f:
3441 case Intrinsic::nvvm_add_rn_f:
3442 case Intrinsic::nvvm_add_rp_f:
3443 case Intrinsic::nvvm_add_rz_f:
3444 case Intrinsic::nvvm_add_rm_d:
3445 case Intrinsic::nvvm_add_rn_d:
3446 case Intrinsic::nvvm_add_rp_d:
3447 case Intrinsic::nvvm_add_rz_d:
3448 case Intrinsic::nvvm_add_rm_ftz_f:
3449 case Intrinsic::nvvm_add_rn_ftz_f:
3450 case Intrinsic::nvvm_add_rp_ftz_f:
3451 case Intrinsic::nvvm_add_rz_ftz_f: {
3452
3453 bool IsFTZ = nvvm::FAddShouldFTZ(IntrinsicID);
3454 APFloat A = IsFTZ ? FTZPreserveSign(Op1V) : Op1V;
3455 APFloat B = IsFTZ ? FTZPreserveSign(Op2V) : Op2V;
3456
3457 APFloat::roundingMode RoundMode =
3458 nvvm::GetFAddRoundingMode(IntrinsicID);
3459
3460 APFloat Res = A;
3461 APFloat::opStatus Status = Res.add(B, RoundMode);
3462
3463 if (!Res.isNaN() &&
3465 Res = IsFTZ ? FTZPreserveSign(Res) : Res;
3466 return ConstantFP::get(Ty, Res);
3467 }
3468 return nullptr;
3469 }
3470
3471 case Intrinsic::nvvm_mul_rm_f:
3472 case Intrinsic::nvvm_mul_rn_f:
3473 case Intrinsic::nvvm_mul_rp_f:
3474 case Intrinsic::nvvm_mul_rz_f:
3475 case Intrinsic::nvvm_mul_rm_d:
3476 case Intrinsic::nvvm_mul_rn_d:
3477 case Intrinsic::nvvm_mul_rp_d:
3478 case Intrinsic::nvvm_mul_rz_d:
3479 case Intrinsic::nvvm_mul_rm_ftz_f:
3480 case Intrinsic::nvvm_mul_rn_ftz_f:
3481 case Intrinsic::nvvm_mul_rp_ftz_f:
3482 case Intrinsic::nvvm_mul_rz_ftz_f: {
3483
3484 bool IsFTZ = nvvm::FMulShouldFTZ(IntrinsicID);
3485 APFloat A = IsFTZ ? FTZPreserveSign(Op1V) : Op1V;
3486 APFloat B = IsFTZ ? FTZPreserveSign(Op2V) : Op2V;
3487
3488 APFloat::roundingMode RoundMode =
3489 nvvm::GetFMulRoundingMode(IntrinsicID);
3490
3491 APFloat Res = A;
3492 APFloat::opStatus Status = Res.multiply(B, RoundMode);
3493
3494 if (!Res.isNaN() &&
3496 Res = IsFTZ ? FTZPreserveSign(Res) : Res;
3497 return ConstantFP::get(Ty, Res);
3498 }
3499 return nullptr;
3500 }
3501
3502 case Intrinsic::nvvm_div_rm_f:
3503 case Intrinsic::nvvm_div_rn_f:
3504 case Intrinsic::nvvm_div_rp_f:
3505 case Intrinsic::nvvm_div_rz_f:
3506 case Intrinsic::nvvm_div_rm_d:
3507 case Intrinsic::nvvm_div_rn_d:
3508 case Intrinsic::nvvm_div_rp_d:
3509 case Intrinsic::nvvm_div_rz_d:
3510 case Intrinsic::nvvm_div_rm_ftz_f:
3511 case Intrinsic::nvvm_div_rn_ftz_f:
3512 case Intrinsic::nvvm_div_rp_ftz_f:
3513 case Intrinsic::nvvm_div_rz_ftz_f: {
3514 bool IsFTZ = nvvm::FDivShouldFTZ(IntrinsicID);
3515 APFloat A = IsFTZ ? FTZPreserveSign(Op1V) : Op1V;
3516 APFloat B = IsFTZ ? FTZPreserveSign(Op2V) : Op2V;
3517 APFloat::roundingMode RoundMode =
3518 nvvm::GetFDivRoundingMode(IntrinsicID);
3519
3520 APFloat Res = A;
3521 APFloat::opStatus Status = Res.divide(B, RoundMode);
3522 if (!Res.isNaN() &&
3524 Res = IsFTZ ? FTZPreserveSign(Res) : Res;
3525 return ConstantFP::get(Ty, Res);
3526 }
3527 return nullptr;
3528 }
3529 }
3530
3531 if (!Ty->isHalfTy() && !Ty->isFloatTy() && !Ty->isDoubleTy())
3532 return nullptr;
3533
3534 switch (IntrinsicID) {
3535 default:
3536 break;
3537 case Intrinsic::pow:
3538 return ConstantFoldBinaryFP(pow, Op1V, Op2V, Ty);
3539 case Intrinsic::amdgcn_fmul_legacy:
3540 // The legacy behaviour is that multiplying +/- 0.0 by anything, even
3541 // NaN or infinity, gives +0.0.
3542 if (Op1V.isZero() || Op2V.isZero())
3543 return ConstantFP::getZero(Ty);
3544 return ConstantFP::get(Ty, Op1V * Op2V);
3545 }
3546
3547 } else if (auto *Op2C = dyn_cast<ConstantInt>(Operands[1])) {
3548 switch (IntrinsicID) {
3549 case Intrinsic::ldexp: {
3550 return ConstantFP::get(
3551 Ty->getContext(),
3552 scalbn(Op1V, Op2C->getSExtValue(), APFloat::rmNearestTiesToEven));
3553 }
3554 case Intrinsic::is_fpclass: {
3555 FPClassTest Mask = static_cast<FPClassTest>(Op2C->getZExtValue());
3556 bool Result =
3557 ((Mask & fcSNan) && Op1V.isNaN() && Op1V.isSignaling()) ||
3558 ((Mask & fcQNan) && Op1V.isNaN() && !Op1V.isSignaling()) ||
3559 ((Mask & fcNegInf) && Op1V.isNegInfinity()) ||
3560 ((Mask & fcNegNormal) && Op1V.isNormal() && Op1V.isNegative()) ||
3561 ((Mask & fcNegSubnormal) && Op1V.isDenormal() && Op1V.isNegative()) ||
3562 ((Mask & fcNegZero) && Op1V.isZero() && Op1V.isNegative()) ||
3563 ((Mask & fcPosZero) && Op1V.isZero() && !Op1V.isNegative()) ||
3564 ((Mask & fcPosSubnormal) && Op1V.isDenormal() && !Op1V.isNegative()) ||
3565 ((Mask & fcPosNormal) && Op1V.isNormal() && !Op1V.isNegative()) ||
3566 ((Mask & fcPosInf) && Op1V.isPosInfinity());
3567 return ConstantInt::get(Ty, Result);
3568 }
3569 case Intrinsic::powi: {
3570 int Exp = static_cast<int>(Op2C->getSExtValue());
3571 switch (Ty->getTypeID()) {
3572 case Type::HalfTyID:
3573 case Type::FloatTyID: {
3574 APFloat Res(static_cast<float>(std::pow(Op1V.convertToFloat(), Exp)));
3575 if (Ty->isHalfTy()) {
3576 bool Unused;
3578 &Unused);
3579 }
3580 return ConstantFP::get(Ty, Res);
3581 }
3582 case Type::DoubleTyID:
3583 return ConstantFP::get(Ty, std::pow(Op1V.convertToDouble(), Exp));
3584 default:
3585 return nullptr;
3586 }
3587 }
3588 default:
3589 break;
3590 }
3591 }
3592 return nullptr;
3593 }
3594
3595 if (Operands[0]->getType()->isIntegerTy() &&
3596 Operands[1]->getType()->isIntegerTy()) {
3597 const APInt *C0, *C1;
3598 if (!getConstIntOrUndef(Operands[0], C0) ||
3599 !getConstIntOrUndef(Operands[1], C1))
3600 return nullptr;
3601
3602 switch (IntrinsicID) {
3603 default: break;
3604 case Intrinsic::smax:
3605 case Intrinsic::smin:
3606 case Intrinsic::umax:
3607 case Intrinsic::umin:
3608 if (!C0 && !C1)
3609 return UndefValue::get(Ty);
3610 if (!C0 || !C1)
3611 return MinMaxIntrinsic::getSaturationPoint(IntrinsicID, Ty);
3612 return ConstantInt::get(
3613 Ty, ICmpInst::compare(*C0, *C1,
3614 MinMaxIntrinsic::getPredicate(IntrinsicID))
3615 ? *C0
3616 : *C1);
3617
3618 case Intrinsic::scmp:
3619 case Intrinsic::ucmp:
3620 if (!C0 || !C1)
3621 return ConstantInt::get(Ty, 0);
3622
3623 int Res;
3624 if (IntrinsicID == Intrinsic::scmp)
3625 Res = C0->sgt(*C1) ? 1 : C0->slt(*C1) ? -1 : 0;
3626 else
3627 Res = C0->ugt(*C1) ? 1 : C0->ult(*C1) ? -1 : 0;
3628 return ConstantInt::get(Ty, Res, /*IsSigned=*/true);
3629
3630 case Intrinsic::usub_with_overflow:
3631 case Intrinsic::ssub_with_overflow:
3632 // X - undef -> { 0, false }
3633 // undef - X -> { 0, false }
3634 if (!C0 || !C1)
3635 return Constant::getNullValue(Ty);
3636 [[fallthrough]];
3637 case Intrinsic::uadd_with_overflow:
3638 case Intrinsic::sadd_with_overflow:
3639 // X + undef -> { -1, false }
3640 // undef + x -> { -1, false }
3641 if (!C0 || !C1) {
3642 return ConstantStruct::get(
3643 cast<StructType>(Ty),
3644 {Constant::getAllOnesValue(Ty->getStructElementType(0)),
3645 Constant::getNullValue(Ty->getStructElementType(1))});
3646 }
3647 [[fallthrough]];
3648 case Intrinsic::smul_with_overflow:
3649 case Intrinsic::umul_with_overflow: {
3650 // undef * X -> { 0, false }
3651 // X * undef -> { 0, false }
3652 if (!C0 || !C1)
3653 return Constant::getNullValue(Ty);
3654
3655 APInt Res;
3656 bool Overflow;
3657 switch (IntrinsicID) {
3658 default: llvm_unreachable("Invalid case");
3659 case Intrinsic::sadd_with_overflow:
3660 Res = C0->sadd_ov(*C1, Overflow);
3661 break;
3662 case Intrinsic::uadd_with_overflow:
3663 Res = C0->uadd_ov(*C1, Overflow);
3664 break;
3665 case Intrinsic::ssub_with_overflow:
3666 Res = C0->ssub_ov(*C1, Overflow);
3667 break;
3668 case Intrinsic::usub_with_overflow:
3669 Res = C0->usub_ov(*C1, Overflow);
3670 break;
3671 case Intrinsic::smul_with_overflow:
3672 Res = C0->smul_ov(*C1, Overflow);
3673 break;
3674 case Intrinsic::umul_with_overflow:
3675 Res = C0->umul_ov(*C1, Overflow);
3676 break;
3677 }
3678 Constant *Ops[] = {
3679 ConstantInt::get(Ty->getContext(), Res),
3680 ConstantInt::get(Type::getInt1Ty(Ty->getContext()), Overflow)
3681 };
3683 }
3684 case Intrinsic::uadd_sat:
3685 case Intrinsic::sadd_sat:
3686 if (!C0 && !C1)
3687 return UndefValue::get(Ty);
3688 if (!C0 || !C1)
3689 return Constant::getAllOnesValue(Ty);
3690 if (IntrinsicID == Intrinsic::uadd_sat)
3691 return ConstantInt::get(Ty, C0->uadd_sat(*C1));
3692 else
3693 return ConstantInt::get(Ty, C0->sadd_sat(*C1));
3694 case Intrinsic::usub_sat:
3695 case Intrinsic::ssub_sat:
3696 if (!C0 && !C1)
3697 return UndefValue::get(Ty);
3698 if (!C0 || !C1)
3699 return Constant::getNullValue(Ty);
3700 if (IntrinsicID == Intrinsic::usub_sat)
3701 return ConstantInt::get(Ty, C0->usub_sat(*C1));
3702 else
3703 return ConstantInt::get(Ty, C0->ssub_sat(*C1));
3704 case Intrinsic::cttz:
3705 case Intrinsic::ctlz:
3706 assert(C1 && "Must be constant int");
3707
3708 // cttz(0, 1) and ctlz(0, 1) are poison.
3709 if (C1->isOne() && (!C0 || C0->isZero()))
3710 return PoisonValue::get(Ty);
3711 if (!C0)
3712 return Constant::getNullValue(Ty);
3713 if (IntrinsicID == Intrinsic::cttz)
3714 return ConstantInt::get(Ty, C0->countr_zero());
3715 else
3716 return ConstantInt::get(Ty, C0->countl_zero());
3717
3718 case Intrinsic::abs:
3719 assert(C1 && "Must be constant int");
3720 assert((C1->isOne() || C1->isZero()) && "Must be 0 or 1");
3721
3722 // Undef or minimum val operand with poison min --> poison
3723 if (C1->isOne() && (!C0 || C0->isMinSignedValue()))
3724 return PoisonValue::get(Ty);
3725
3726 // Undef operand with no poison min --> 0 (sign bit must be clear)
3727 if (!C0)
3728 return Constant::getNullValue(Ty);
3729
3730 return ConstantInt::get(Ty, C0->abs());
3731 case Intrinsic::amdgcn_wave_reduce_umin:
3732 case Intrinsic::amdgcn_wave_reduce_umax:
3733 case Intrinsic::amdgcn_wave_reduce_max:
3734 case Intrinsic::amdgcn_wave_reduce_min:
3735 case Intrinsic::amdgcn_wave_reduce_add:
3736 case Intrinsic::amdgcn_wave_reduce_sub:
3737 case Intrinsic::amdgcn_wave_reduce_and:
3738 case Intrinsic::amdgcn_wave_reduce_or:
3739 case Intrinsic::amdgcn_wave_reduce_xor:
3740 return Operands[0];
3741 }
3742
3743 return nullptr;
3744 }
3745
3746 // Support ConstantVector in case we have an Undef in the top.
3747 if ((isa<ConstantVector>(Operands[0]) ||
3748 isa<ConstantDataVector>(Operands[0])) &&
3749 // Check for default rounding mode.
3750 // FIXME: Support other rounding modes?
3751 isa<ConstantInt>(Operands[1]) &&
3752 cast<ConstantInt>(Operands[1])->getValue() == 4) {
3753 auto *Op = cast<Constant>(Operands[0]);
3754 switch (IntrinsicID) {
3755 default: break;
3756 case Intrinsic::x86_avx512_vcvtss2si32:
3757 case Intrinsic::x86_avx512_vcvtss2si64:
3758 case Intrinsic::x86_avx512_vcvtsd2si32:
3759 case Intrinsic::x86_avx512_vcvtsd2si64:
3760 if (ConstantFP *FPOp =
3761 dyn_cast_or_null<ConstantFP>(Op->getAggregateElement(0U)))
3762 return ConstantFoldSSEConvertToInt(FPOp->getValueAPF(),
3763 /*roundTowardZero=*/false, Ty,
3764 /*IsSigned*/true);
3765 break;
3766 case Intrinsic::x86_avx512_vcvtss2usi32:
3767 case Intrinsic::x86_avx512_vcvtss2usi64:
3768 case Intrinsic::x86_avx512_vcvtsd2usi32:
3769 case Intrinsic::x86_avx512_vcvtsd2usi64:
3770 if (ConstantFP *FPOp =
3771 dyn_cast_or_null<ConstantFP>(Op->getAggregateElement(0U)))
3772 return ConstantFoldSSEConvertToInt(FPOp->getValueAPF(),
3773 /*roundTowardZero=*/false, Ty,
3774 /*IsSigned*/false);
3775 break;
3776 case Intrinsic::x86_avx512_cvttss2si:
3777 case Intrinsic::x86_avx512_cvttss2si64:
3778 case Intrinsic::x86_avx512_cvttsd2si:
3779 case Intrinsic::x86_avx512_cvttsd2si64:
3780 if (ConstantFP *FPOp =
3781 dyn_cast_or_null<ConstantFP>(Op->getAggregateElement(0U)))
3782 return ConstantFoldSSEConvertToInt(FPOp->getValueAPF(),
3783 /*roundTowardZero=*/true, Ty,
3784 /*IsSigned*/true);
3785 break;
3786 case Intrinsic::x86_avx512_cvttss2usi:
3787 case Intrinsic::x86_avx512_cvttss2usi64:
3788 case Intrinsic::x86_avx512_cvttsd2usi:
3789 case Intrinsic::x86_avx512_cvttsd2usi64:
3790 if (ConstantFP *FPOp =
3791 dyn_cast_or_null<ConstantFP>(Op->getAggregateElement(0U)))
3792 return ConstantFoldSSEConvertToInt(FPOp->getValueAPF(),
3793 /*roundTowardZero=*/true, Ty,
3794 /*IsSigned*/false);
3795 break;
3796 }
3797 }
3798
3799 if (IntrinsicID == Intrinsic::experimental_cttz_elts) {
3800 auto *FVTy = dyn_cast<FixedVectorType>(Operands[0]->getType());
3801 bool ZeroIsPoison = cast<ConstantInt>(Operands[1])->isOne();
3802 if (!FVTy)
3803 return nullptr;
3804 unsigned Width = Ty->getIntegerBitWidth();
3805 if (APInt::getMaxValue(Width).ult(FVTy->getNumElements()))
3806 return PoisonValue::get(Ty);
3807 for (unsigned I = 0; I < FVTy->getNumElements(); ++I) {
3808 Constant *Elt = Operands[0]->getAggregateElement(I);
3809 if (!Elt)
3810 return nullptr;
3811 if (isa<UndefValue>(Elt) || Elt->isNullValue())
3812 continue;
3813 return ConstantInt::get(Ty, I);
3814 }
3815 if (ZeroIsPoison)
3816 return PoisonValue::get(Ty);
3817 return ConstantInt::get(Ty, FVTy->getNumElements());
3818 }
3819 return nullptr;
3820}
3821
3822static APFloat ConstantFoldAMDGCNCubeIntrinsic(Intrinsic::ID IntrinsicID,
3823 const APFloat &S0,
3824 const APFloat &S1,
3825 const APFloat &S2) {
3826 unsigned ID;
3827 const fltSemantics &Sem = S0.getSemantics();
3828 APFloat MA(Sem), SC(Sem), TC(Sem);
3829 if (abs(S2) >= abs(S0) && abs(S2) >= abs(S1)) {
3830 if (S2.isNegative() && S2.isNonZero() && !S2.isNaN()) {
3831 // S2 < 0
3832 ID = 5;
3833 SC = -S0;
3834 } else {
3835 ID = 4;
3836 SC = S0;
3837 }
3838 MA = S2;
3839 TC = -S1;
3840 } else if (abs(S1) >= abs(S0)) {
3841 if (S1.isNegative() && S1.isNonZero() && !S1.isNaN()) {
3842 // S1 < 0
3843 ID = 3;
3844 TC = -S2;
3845 } else {
3846 ID = 2;
3847 TC = S2;
3848 }
3849 MA = S1;
3850 SC = S0;
3851 } else {
3852 if (S0.isNegative() && S0.isNonZero() && !S0.isNaN()) {
3853 // S0 < 0
3854 ID = 1;
3855 SC = S2;
3856 } else {
3857 ID = 0;
3858 SC = -S2;
3859 }
3860 MA = S0;
3861 TC = -S1;
3862 }
3863 switch (IntrinsicID) {
3864 default:
3865 llvm_unreachable("unhandled amdgcn cube intrinsic");
3866 case Intrinsic::amdgcn_cubeid:
3867 return APFloat(Sem, ID);
3868 case Intrinsic::amdgcn_cubema:
3869 return MA + MA;
3870 case Intrinsic::amdgcn_cubesc:
3871 return SC;
3872 case Intrinsic::amdgcn_cubetc:
3873 return TC;
3874 }
3875}
3876
3877static Constant *ConstantFoldAMDGCNPermIntrinsic(ArrayRef<Constant *> Operands,
3878 Type *Ty) {
3879 const APInt *C0, *C1, *C2;
3880 if (!getConstIntOrUndef(Operands[0], C0) ||
3881 !getConstIntOrUndef(Operands[1], C1) ||
3882 !getConstIntOrUndef(Operands[2], C2))
3883 return nullptr;
3884
3885 if (!C2)
3886 return UndefValue::get(Ty);
3887
3888 APInt Val(32, 0);
3889 unsigned NumUndefBytes = 0;
3890 for (unsigned I = 0; I < 32; I += 8) {
3891 unsigned Sel = C2->extractBitsAsZExtValue(8, I);
3892 unsigned B = 0;
3893
3894 if (Sel >= 13)
3895 B = 0xff;
3896 else if (Sel == 12)
3897 B = 0x00;
3898 else {
3899 const APInt *Src = ((Sel & 10) == 10 || (Sel & 12) == 4) ? C0 : C1;
3900 if (!Src)
3901 ++NumUndefBytes;
3902 else if (Sel < 8)
3903 B = Src->extractBitsAsZExtValue(8, (Sel & 3) * 8);
3904 else
3905 B = Src->extractBitsAsZExtValue(1, (Sel & 1) ? 31 : 15) * 0xff;
3906 }
3907
3908 Val.insertBits(B, I, 8);
3909 }
3910
3911 if (NumUndefBytes == 4)
3912 return UndefValue::get(Ty);
3913
3914 return ConstantInt::get(Ty, Val);
3915}
3916
3917static Constant *ConstantFoldScalarCall3(StringRef Name,
3918 Intrinsic::ID IntrinsicID,
3919 Type *Ty,
3920 ArrayRef<Constant *> Operands,
3921 const TargetLibraryInfo *TLI,
3922 const CallBase *Call) {
3923 assert(Operands.size() == 3 && "Wrong number of operands.");
3924
3925 if (const auto *Op1 = dyn_cast<ConstantFP>(Operands[0])) {
3926 if (const auto *Op2 = dyn_cast<ConstantFP>(Operands[1])) {
3927 if (const auto *Op3 = dyn_cast<ConstantFP>(Operands[2])) {
3928 const APFloat &C1 = Op1->getValueAPF();
3929 const APFloat &C2 = Op2->getValueAPF();
3930 const APFloat &C3 = Op3->getValueAPF();
3931
3932 if (const auto *ConstrIntr = dyn_cast<ConstrainedFPIntrinsic>(Call)) {
3933 RoundingMode RM = getEvaluationRoundingMode(ConstrIntr);
3934 APFloat Res = C1;
3936 switch (IntrinsicID) {
3937 default:
3938 return nullptr;
3939 case Intrinsic::experimental_constrained_fma:
3940 case Intrinsic::experimental_constrained_fmuladd:
3941 St = Res.fusedMultiplyAdd(C2, C3, RM);
3942 break;
3943 }
3944 if (mayFoldConstrained(
3945 const_cast<ConstrainedFPIntrinsic *>(ConstrIntr), St))
3946 return ConstantFP::get(Ty, Res);
3947 return nullptr;
3948 }
3949
3950 switch (IntrinsicID) {
3951 default: break;
3952 case Intrinsic::amdgcn_fma_legacy: {
3953 // The legacy behaviour is that multiplying +/- 0.0 by anything, even
3954 // NaN or infinity, gives +0.0.
3955 if (C1.isZero() || C2.isZero()) {
3956 // It's tempting to just return C3 here, but that would give the
3957 // wrong result if C3 was -0.0.
3958 return ConstantFP::get(Ty, APFloat(0.0f) + C3);
3959 }
3960 [[fallthrough]];
3961 }
3962 case Intrinsic::fma:
3963 case Intrinsic::fmuladd: {
3964 APFloat V = C1;
3966 return ConstantFP::get(Ty, V);
3967 }
3968
3969 case Intrinsic::nvvm_fma_rm_f:
3970 case Intrinsic::nvvm_fma_rn_f:
3971 case Intrinsic::nvvm_fma_rp_f:
3972 case Intrinsic::nvvm_fma_rz_f:
3973 case Intrinsic::nvvm_fma_rm_d:
3974 case Intrinsic::nvvm_fma_rn_d:
3975 case Intrinsic::nvvm_fma_rp_d:
3976 case Intrinsic::nvvm_fma_rz_d:
3977 case Intrinsic::nvvm_fma_rm_ftz_f:
3978 case Intrinsic::nvvm_fma_rn_ftz_f:
3979 case Intrinsic::nvvm_fma_rp_ftz_f:
3980 case Intrinsic::nvvm_fma_rz_ftz_f: {
3981 bool IsFTZ = nvvm::FMAShouldFTZ(IntrinsicID);
3982 APFloat A = IsFTZ ? FTZPreserveSign(C1) : C1;
3983 APFloat B = IsFTZ ? FTZPreserveSign(C2) : C2;
3984 APFloat C = IsFTZ ? FTZPreserveSign(C3) : C3;
3985
3986 APFloat::roundingMode RoundMode =
3987 nvvm::GetFMARoundingMode(IntrinsicID);
3988
3989 APFloat Res = A;
3990 APFloat::opStatus Status = Res.fusedMultiplyAdd(B, C, RoundMode);
3991
3992 if (!Res.isNaN() &&
3994 Res = IsFTZ ? FTZPreserveSign(Res) : Res;
3995 return ConstantFP::get(Ty, Res);
3996 }
3997 return nullptr;
3998 }
3999
4000 case Intrinsic::amdgcn_cubeid:
4001 case Intrinsic::amdgcn_cubema:
4002 case Intrinsic::amdgcn_cubesc:
4003 case Intrinsic::amdgcn_cubetc: {
4004 APFloat V = ConstantFoldAMDGCNCubeIntrinsic(IntrinsicID, C1, C2, C3);
4005 return ConstantFP::get(Ty, V);
4006 }
4007 }
4008 }
4009 }
4010 }
4011
4012 if (IntrinsicID == Intrinsic::smul_fix ||
4013 IntrinsicID == Intrinsic::smul_fix_sat) {
4014 const APInt *C0, *C1;
4015 if (!getConstIntOrUndef(Operands[0], C0) ||
4016 !getConstIntOrUndef(Operands[1], C1))
4017 return nullptr;
4018
4019 // undef * C -> 0
4020 // C * undef -> 0
4021 if (!C0 || !C1)
4022 return Constant::getNullValue(Ty);
4023
4024 // This code performs rounding towards negative infinity in case the result
4025 // cannot be represented exactly for the given scale. Targets that do care
4026 // about rounding should use a target hook for specifying how rounding
4027 // should be done, and provide their own folding to be consistent with
4028 // rounding. This is the same approach as used by
4029 // DAGTypeLegalizer::ExpandIntRes_MULFIX.
4030 unsigned Scale = cast<ConstantInt>(Operands[2])->getZExtValue();
4031 unsigned Width = C0->getBitWidth();
4032 assert(Scale < Width && "Illegal scale.");
4033 unsigned ExtendedWidth = Width * 2;
4034 APInt Product =
4035 (C0->sext(ExtendedWidth) * C1->sext(ExtendedWidth)).ashr(Scale);
4036 if (IntrinsicID == Intrinsic::smul_fix_sat) {
4037 APInt Max = APInt::getSignedMaxValue(Width).sext(ExtendedWidth);
4038 APInt Min = APInt::getSignedMinValue(Width).sext(ExtendedWidth);
4039 Product = APIntOps::smin(Product, Max);
4040 Product = APIntOps::smax(Product, Min);
4041 }
4042 return ConstantInt::get(Ty->getContext(), Product.sextOrTrunc(Width));
4043 }
4044
4045 if (IntrinsicID == Intrinsic::fshl || IntrinsicID == Intrinsic::fshr) {
4046 const APInt *C0, *C1, *C2;
4047 if (!getConstIntOrUndef(Operands[0], C0) ||
4048 !getConstIntOrUndef(Operands[1], C1) ||
4049 !getConstIntOrUndef(Operands[2], C2))
4050 return nullptr;
4051
4052 bool IsRight = IntrinsicID == Intrinsic::fshr;
4053 if (!C2)
4054 return Operands[IsRight ? 1 : 0];
4055 if (!C0 && !C1)
4056 return UndefValue::get(Ty);
4057
4058 // The shift amount is interpreted as modulo the bitwidth. If the shift
4059 // amount is effectively 0, avoid UB due to oversized inverse shift below.
4060 unsigned BitWidth = C2->getBitWidth();
4061 unsigned ShAmt = C2->urem(BitWidth);
4062 if (!ShAmt)
4063 return Operands[IsRight ? 1 : 0];
4064
4065 // (C0 << ShlAmt) | (C1 >> LshrAmt)
4066 unsigned LshrAmt = IsRight ? ShAmt : BitWidth - ShAmt;
4067 unsigned ShlAmt = !IsRight ? ShAmt : BitWidth - ShAmt;
4068 if (!C0)
4069 return ConstantInt::get(Ty, C1->lshr(LshrAmt));
4070 if (!C1)
4071 return ConstantInt::get(Ty, C0->shl(ShlAmt));
4072 return ConstantInt::get(Ty, C0->shl(ShlAmt) | C1->lshr(LshrAmt));
4073 }
4074
4075 if (IntrinsicID == Intrinsic::amdgcn_perm)
4076 return ConstantFoldAMDGCNPermIntrinsic(Operands, Ty);
4077
4078 return nullptr;
4079}
4080
4081static Constant *ConstantFoldScalarCall(StringRef Name,
4082 Intrinsic::ID IntrinsicID,
4083 Type *Ty,
4084 ArrayRef<Constant *> Operands,
4085 const TargetLibraryInfo *TLI,
4086 const CallBase *Call) {
4087 if (IntrinsicID != Intrinsic::not_intrinsic &&
4088 any_of(Operands, IsaPred<PoisonValue>) &&
4089 intrinsicPropagatesPoison(IntrinsicID))
4090 return PoisonValue::get(Ty);
4091
4092 if (Operands.size() == 1)
4093 return ConstantFoldScalarCall1(Name, IntrinsicID, Ty, Operands, TLI, Call);
4094
4095 if (Operands.size() == 2) {
4096 if (Constant *FoldedLibCall =
4097 ConstantFoldLibCall2(Name, Ty, Operands, TLI)) {
4098 return FoldedLibCall;
4099 }
4100 return ConstantFoldIntrinsicCall2(IntrinsicID, Ty, Operands, Call);
4101 }
4102
4103 if (Operands.size() == 3)
4104 return ConstantFoldScalarCall3(Name, IntrinsicID, Ty, Operands, TLI, Call);
4105
4106 return nullptr;
4107}
4108
4109static Constant *ConstantFoldFixedVectorCall(
4110 StringRef Name, Intrinsic::ID IntrinsicID, FixedVectorType *FVTy,
4111 ArrayRef<Constant *> Operands, const DataLayout &DL,
4112 const TargetLibraryInfo *TLI, const CallBase *Call) {
4114 SmallVector<Constant *, 4> Lane(Operands.size());
4115 Type *Ty = FVTy->getElementType();
4116
4117 switch (IntrinsicID) {
4118 case Intrinsic::masked_load: {
4119 auto *SrcPtr = Operands[0];
4120 auto *Mask = Operands[1];
4121 auto *Passthru = Operands[2];
4122
4123 Constant *VecData = ConstantFoldLoadFromConstPtr(SrcPtr, FVTy, DL);
4124
4125 SmallVector<Constant *, 32> NewElements;
4126 for (unsigned I = 0, E = FVTy->getNumElements(); I != E; ++I) {
4127 auto *MaskElt = Mask->getAggregateElement(I);
4128 if (!MaskElt)
4129 break;
4130 auto *PassthruElt = Passthru->getAggregateElement(I);
4131 auto *VecElt = VecData ? VecData->getAggregateElement(I) : nullptr;
4132 if (isa<UndefValue>(MaskElt)) {
4133 if (PassthruElt)
4134 NewElements.push_back(PassthruElt);
4135 else if (VecElt)
4136 NewElements.push_back(VecElt);
4137 else
4138 return nullptr;
4139 }
4140 if (MaskElt->isNullValue()) {
4141 if (!PassthruElt)
4142 return nullptr;
4143 NewElements.push_back(PassthruElt);
4144 } else if (MaskElt->isOneValue()) {
4145 if (!VecElt)
4146 return nullptr;
4147 NewElements.push_back(VecElt);
4148 } else {
4149 return nullptr;
4150 }
4151 }
4152 if (NewElements.size() != FVTy->getNumElements())
4153 return nullptr;
4154 return ConstantVector::get(NewElements);
4155 }
4156 case Intrinsic::arm_mve_vctp8:
4157 case Intrinsic::arm_mve_vctp16:
4158 case Intrinsic::arm_mve_vctp32:
4159 case Intrinsic::arm_mve_vctp64: {
4160 if (auto *Op = dyn_cast<ConstantInt>(Operands[0])) {
4161 unsigned Lanes = FVTy->getNumElements();
4162 uint64_t Limit = Op->getZExtValue();
4163
4165 for (unsigned i = 0; i < Lanes; i++) {
4166 if (i < Limit)
4168 else
4170 }
4171 return ConstantVector::get(NCs);
4172 }
4173 return nullptr;
4174 }
4175 case Intrinsic::get_active_lane_mask: {
4176 auto *Op0 = dyn_cast<ConstantInt>(Operands[0]);
4177 auto *Op1 = dyn_cast<ConstantInt>(Operands[1]);
4178 if (Op0 && Op1) {
4179 unsigned Lanes = FVTy->getNumElements();
4180 uint64_t Base = Op0->getZExtValue();
4181 uint64_t Limit = Op1->getZExtValue();
4182
4184 for (unsigned i = 0; i < Lanes; i++) {
4185 if (Base + i < Limit)
4187 else
4189 }
4190 return ConstantVector::get(NCs);
4191 }
4192 return nullptr;
4193 }
4194 case Intrinsic::vector_extract: {
4195 auto *Idx = dyn_cast<ConstantInt>(Operands[1]);
4196 Constant *Vec = Operands[0];
4197 if (!Idx || !isa<FixedVectorType>(Vec->getType()))
4198 return nullptr;
4199
4200 unsigned NumElements = FVTy->getNumElements();
4201 unsigned VecNumElements =
4202 cast<FixedVectorType>(Vec->getType())->getNumElements();
4203 unsigned StartingIndex = Idx->getZExtValue();
4204
4205 // Extracting entire vector is nop
4206 if (NumElements == VecNumElements && StartingIndex == 0)
4207 return Vec;
4208
4209 for (unsigned I = StartingIndex, E = StartingIndex + NumElements; I < E;
4210 ++I) {
4211 Constant *Elt = Vec->getAggregateElement(I);
4212 if (!Elt)
4213 return nullptr;
4214 Result[I - StartingIndex] = Elt;
4215 }
4216
4217 return ConstantVector::get(Result);
4218 }
4219 case Intrinsic::vector_insert: {
4220 Constant *Vec = Operands[0];
4221 Constant *SubVec = Operands[1];
4222 auto *Idx = dyn_cast<ConstantInt>(Operands[2]);
4223 if (!Idx || !isa<FixedVectorType>(Vec->getType()))
4224 return nullptr;
4225
4226 unsigned SubVecNumElements =
4227 cast<FixedVectorType>(SubVec->getType())->getNumElements();
4228 unsigned VecNumElements =
4229 cast<FixedVectorType>(Vec->getType())->getNumElements();
4230 unsigned IdxN = Idx->getZExtValue();
4231 // Replacing entire vector with a subvec is nop
4232 if (SubVecNumElements == VecNumElements && IdxN == 0)
4233 return SubVec;
4234
4235 for (unsigned I = 0; I < VecNumElements; ++I) {
4236 Constant *Elt;
4237 if (I < IdxN + SubVecNumElements)
4238 Elt = SubVec->getAggregateElement(I - IdxN);
4239 else
4240 Elt = Vec->getAggregateElement(I);
4241 if (!Elt)
4242 return nullptr;
4243 Result[I] = Elt;
4244 }
4245 return ConstantVector::get(Result);
4246 }
4247 case Intrinsic::vector_interleave2:
4248 case Intrinsic::vector_interleave3:
4249 case Intrinsic::vector_interleave4:
4250 case Intrinsic::vector_interleave5:
4251 case Intrinsic::vector_interleave6:
4252 case Intrinsic::vector_interleave7:
4253 case Intrinsic::vector_interleave8: {
4254 unsigned NumElements =
4255 cast<FixedVectorType>(Operands[0]->getType())->getNumElements();
4256 unsigned NumOperands = Operands.size();
4257 for (unsigned I = 0; I < NumElements; ++I) {
4258 for (unsigned J = 0; J < NumOperands; ++J) {
4259 Constant *Elt = Operands[J]->getAggregateElement(I);
4260 if (!Elt)
4261 return nullptr;
4262 Result[NumOperands * I + J] = Elt;
4263 }
4264 }
4265 return ConstantVector::get(Result);
4266 }
4267 case Intrinsic::wasm_dot: {
4268 unsigned NumElements =
4269 cast<FixedVectorType>(Operands[0]->getType())->getNumElements();
4270
4271 assert(NumElements == 8 && Result.size() == 4 &&
4272 "wasm dot takes i16x8 and produces i32x4");
4273 assert(Ty->isIntegerTy());
4274 int32_t MulVector[8];
4275
4276 for (unsigned I = 0; I < NumElements; ++I) {
4277 ConstantInt *Elt0 =
4278 cast<ConstantInt>(Operands[0]->getAggregateElement(I));
4279 ConstantInt *Elt1 =
4280 cast<ConstantInt>(Operands[1]->getAggregateElement(I));
4281
4282 MulVector[I] = Elt0->getSExtValue() * Elt1->getSExtValue();
4283 }
4284 for (unsigned I = 0; I < Result.size(); I++) {
4285 int64_t IAdd = (int64_t)MulVector[I * 2] + (int64_t)MulVector[I * 2 + 1];
4286 Result[I] = ConstantInt::getSigned(Ty, IAdd, /*ImplicitTrunc=*/true);
4287 }
4288
4289 return ConstantVector::get(Result);
4290 }
4291 default:
4292 break;
4293 }
4294
4295 for (unsigned I = 0, E = FVTy->getNumElements(); I != E; ++I) {
4296 // Gather a column of constants.
4297 for (unsigned J = 0, JE = Operands.size(); J != JE; ++J) {
4298 // Some intrinsics use a scalar type for certain arguments.
4299 if (isVectorIntrinsicWithScalarOpAtArg(IntrinsicID, J, /*TTI=*/nullptr)) {
4300 Lane[J] = Operands[J];
4301 continue;
4302 }
4303
4304 Constant *Agg = Operands[J]->getAggregateElement(I);
4305 if (!Agg)
4306 return nullptr;
4307
4308 Lane[J] = Agg;
4309 }
4310
4311 // Use the regular scalar folding to simplify this column.
4312 Constant *Folded =
4313 ConstantFoldScalarCall(Name, IntrinsicID, Ty, Lane, TLI, Call);
4314 if (!Folded)
4315 return nullptr;
4316 Result[I] = Folded;
4317 }
4318
4319 return ConstantVector::get(Result);
4320}
4321
4322static Constant *ConstantFoldScalableVectorCall(
4323 StringRef Name, Intrinsic::ID IntrinsicID, ScalableVectorType *SVTy,
4324 ArrayRef<Constant *> Operands, const DataLayout &DL,
4325 const TargetLibraryInfo *TLI, const CallBase *Call) {
4326 switch (IntrinsicID) {
4327 case Intrinsic::aarch64_sve_convert_from_svbool: {
4328 Constant *Src = Operands[0];
4329 if (!Src->isNullValue())
4330 break;
4331
4332 return ConstantInt::getFalse(SVTy);
4333 }
4334 case Intrinsic::get_active_lane_mask: {
4335 auto *Op0 = dyn_cast<ConstantInt>(Operands[0]);
4336 auto *Op1 = dyn_cast<ConstantInt>(Operands[1]);
4337 if (Op0 && Op1 && Op0->getValue().uge(Op1->getValue()))
4338 return ConstantVector::getNullValue(SVTy);
4339 break;
4340 }
4341 case Intrinsic::vector_interleave2:
4342 case Intrinsic::vector_interleave3:
4343 case Intrinsic::vector_interleave4:
4344 case Intrinsic::vector_interleave5:
4345 case Intrinsic::vector_interleave6:
4346 case Intrinsic::vector_interleave7:
4347 case Intrinsic::vector_interleave8: {
4348 Constant *SplatVal = Operands[0]->getSplatValue();
4349 if (!SplatVal)
4350 return nullptr;
4351
4352 if (!llvm::all_equal(Operands))
4353 return nullptr;
4354
4355 return ConstantVector::getSplat(SVTy->getElementCount(), SplatVal);
4356 }
4357 default:
4358 break;
4359 }
4360
4361 // If trivially vectorizable, try folding it via the scalar call if all
4362 // operands are splats.
4363
4364 // TODO: ConstantFoldFixedVectorCall should probably check this too?
4365 if (!isTriviallyVectorizable(IntrinsicID))
4366 return nullptr;
4367
4369 for (auto [I, Op] : enumerate(Operands)) {
4370 if (isVectorIntrinsicWithScalarOpAtArg(IntrinsicID, I, /*TTI=*/nullptr)) {
4371 SplatOps.push_back(Op);
4372 continue;
4373 }
4374 Constant *Splat = Op->getSplatValue();
4375 if (!Splat)
4376 return nullptr;
4377 SplatOps.push_back(Splat);
4378 }
4379 Constant *Folded = ConstantFoldScalarCall(
4380 Name, IntrinsicID, SVTy->getElementType(), SplatOps, TLI, Call);
4381 if (!Folded)
4382 return nullptr;
4383 return ConstantVector::getSplat(SVTy->getElementCount(), Folded);
4384}
4385
4386static std::pair<Constant *, Constant *>
4387ConstantFoldScalarFrexpCall(Constant *Op, Type *IntTy) {
4388 if (isa<PoisonValue>(Op))
4389 return {Op, PoisonValue::get(IntTy)};
4390
4391 auto *ConstFP = dyn_cast<ConstantFP>(Op);
4392 if (!ConstFP)
4393 return {};
4394
4395 const APFloat &U = ConstFP->getValueAPF();
4396 int FrexpExp;
4397 APFloat FrexpMant = frexp(U, FrexpExp, APFloat::rmNearestTiesToEven);
4398 Constant *Result0 = ConstantFP::get(ConstFP->getType(), FrexpMant);
4399
4400 // The exponent is an "unspecified value" for inf/nan. We use zero to avoid
4401 // using undef.
4402 Constant *Result1 = FrexpMant.isFinite()
4403 ? ConstantInt::getSigned(IntTy, FrexpExp)
4404 : ConstantInt::getNullValue(IntTy);
4405 return {Result0, Result1};
4406}
4407
4408/// Handle intrinsics that return tuples, which may be tuples of vectors.
4409static Constant *
4410ConstantFoldStructCall(StringRef Name, Intrinsic::ID IntrinsicID,
4411 StructType *StTy, ArrayRef<Constant *> Operands,
4412 const DataLayout &DL, const TargetLibraryInfo *TLI,
4413 const CallBase *Call) {
4414
4415 switch (IntrinsicID) {
4416 case Intrinsic::frexp: {
4417 Type *Ty0 = StTy->getContainedType(0);
4418 Type *Ty1 = StTy->getContainedType(1)->getScalarType();
4419
4420 if (auto *FVTy0 = dyn_cast<FixedVectorType>(Ty0)) {
4421 SmallVector<Constant *, 4> Results0(FVTy0->getNumElements());
4422 SmallVector<Constant *, 4> Results1(FVTy0->getNumElements());
4423
4424 for (unsigned I = 0, E = FVTy0->getNumElements(); I != E; ++I) {
4425 Constant *Lane = Operands[0]->getAggregateElement(I);
4426 std::tie(Results0[I], Results1[I]) =
4427 ConstantFoldScalarFrexpCall(Lane, Ty1);
4428 if (!Results0[I])
4429 return nullptr;
4430 }
4431
4432 return ConstantStruct::get(StTy, ConstantVector::get(Results0),
4433 ConstantVector::get(Results1));
4434 }
4435
4436 auto [Result0, Result1] = ConstantFoldScalarFrexpCall(Operands[0], Ty1);
4437 if (!Result0)
4438 return nullptr;
4439 return ConstantStruct::get(StTy, Result0, Result1);
4440 }
4441 case Intrinsic::sincos: {
4442 Type *Ty = StTy->getContainedType(0);
4443 Type *TyScalar = Ty->getScalarType();
4444
4445 auto ConstantFoldScalarSincosCall =
4446 [&](Constant *Op) -> std::pair<Constant *, Constant *> {
4447 Constant *SinResult =
4448 ConstantFoldScalarCall(Name, Intrinsic::sin, TyScalar, Op, TLI, Call);
4449 Constant *CosResult =
4450 ConstantFoldScalarCall(Name, Intrinsic::cos, TyScalar, Op, TLI, Call);
4451 return std::make_pair(SinResult, CosResult);
4452 };
4453
4454 if (auto *FVTy = dyn_cast<FixedVectorType>(Ty)) {
4455 SmallVector<Constant *> SinResults(FVTy->getNumElements());
4456 SmallVector<Constant *> CosResults(FVTy->getNumElements());
4457
4458 for (unsigned I = 0, E = FVTy->getNumElements(); I != E; ++I) {
4459 Constant *Lane = Operands[0]->getAggregateElement(I);
4460 std::tie(SinResults[I], CosResults[I]) =
4461 ConstantFoldScalarSincosCall(Lane);
4462 if (!SinResults[I] || !CosResults[I])
4463 return nullptr;
4464 }
4465
4466 return ConstantStruct::get(StTy, ConstantVector::get(SinResults),
4467 ConstantVector::get(CosResults));
4468 }
4469
4470 auto [SinResult, CosResult] = ConstantFoldScalarSincosCall(Operands[0]);
4471 if (!SinResult || !CosResult)
4472 return nullptr;
4473 return ConstantStruct::get(StTy, SinResult, CosResult);
4474 }
4475 case Intrinsic::vector_deinterleave2:
4476 case Intrinsic::vector_deinterleave3:
4477 case Intrinsic::vector_deinterleave4:
4478 case Intrinsic::vector_deinterleave5:
4479 case Intrinsic::vector_deinterleave6:
4480 case Intrinsic::vector_deinterleave7:
4481 case Intrinsic::vector_deinterleave8: {
4482 unsigned NumResults = StTy->getNumElements();
4483 auto *Vec = Operands[0];
4484 auto *VecTy = cast<VectorType>(Vec->getType());
4485
4486 ElementCount ResultEC =
4487 VecTy->getElementCount().divideCoefficientBy(NumResults);
4488
4489 if (auto *EltC = Vec->getSplatValue()) {
4490 auto *ResultVec = ConstantVector::getSplat(ResultEC, EltC);
4491 SmallVector<Constant *, 8> Results(NumResults, ResultVec);
4492 return ConstantStruct::get(StTy, Results);
4493 }
4494
4495 if (!ResultEC.isFixed())
4496 return nullptr;
4497
4498 unsigned NumElements = ResultEC.getFixedValue();
4500 SmallVector<Constant *> Elements(NumElements);
4501 for (unsigned I = 0; I != NumResults; ++I) {
4502 for (unsigned J = 0; J != NumElements; ++J) {
4503 Constant *Elt = Vec->getAggregateElement(J * NumResults + I);
4504 if (!Elt)
4505 return nullptr;
4506 Elements[J] = Elt;
4507 }
4508 Results[I] = ConstantVector::get(Elements);
4509 }
4510 return ConstantStruct::get(StTy, Results);
4511 }
4512 default:
4513 // TODO: Constant folding of vector intrinsics that fall through here does
4514 // not work (e.g. overflow intrinsics)
4515 return ConstantFoldScalarCall(Name, IntrinsicID, StTy, Operands, TLI, Call);
4516 }
4517
4518 return nullptr;
4519}
4520
4521} // end anonymous namespace
4522
4524 Constant *RHS, Type *Ty,
4527 // Ensure we check flags like StrictFP that might prevent this from getting
4528 // folded before generating a result.
4529 if (Call && !canConstantFoldCallTo(Call, Call->getCalledFunction()))
4530 return nullptr;
4531 return ConstantFoldIntrinsicCall2(ID, Ty, {LHS, RHS}, Call);
4532}
4533
4535 ArrayRef<Constant *> Operands,
4536 const TargetLibraryInfo *TLI,
4537 bool AllowNonDeterministic) {
4538 if (Call->isNoBuiltin())
4539 return nullptr;
4540 if (!F->hasName())
4541 return nullptr;
4542
4543 // If this is not an intrinsic and not recognized as a library call, bail out.
4544 Intrinsic::ID IID = F->getIntrinsicID();
4545 if (IID == Intrinsic::not_intrinsic) {
4546 if (!TLI)
4547 return nullptr;
4548 LibFunc LibF;
4549 if (!TLI->getLibFunc(*F, LibF))
4550 return nullptr;
4551 }
4552
4553 // Conservatively assume that floating-point libcalls may be
4554 // non-deterministic.
4555 Type *Ty = F->getReturnType();
4556 if (!AllowNonDeterministic && Ty->isFPOrFPVectorTy())
4557 return nullptr;
4558
4559 StringRef Name = F->getName();
4560 if (auto *FVTy = dyn_cast<FixedVectorType>(Ty))
4561 return ConstantFoldFixedVectorCall(
4562 Name, IID, FVTy, Operands, F->getDataLayout(), TLI, Call);
4563
4564 if (auto *SVTy = dyn_cast<ScalableVectorType>(Ty))
4565 return ConstantFoldScalableVectorCall(
4566 Name, IID, SVTy, Operands, F->getDataLayout(), TLI, Call);
4567
4568 if (auto *StTy = dyn_cast<StructType>(Ty))
4569 return ConstantFoldStructCall(Name, IID, StTy, Operands,
4570 F->getDataLayout(), TLI, Call);
4571
4572 // TODO: If this is a library function, we already discovered that above,
4573 // so we should pass the LibFunc, not the name (and it might be better
4574 // still to separate intrinsic handling from libcalls).
4575 return ConstantFoldScalarCall(Name, IID, Ty, Operands, TLI, Call);
4576}
4577
4579 const TargetLibraryInfo *TLI) {
4580 // FIXME: Refactor this code; this duplicates logic in LibCallsShrinkWrap
4581 // (and to some extent ConstantFoldScalarCall).
4582 if (Call->isNoBuiltin() || Call->isStrictFP())
4583 return false;
4584 Function *F = Call->getCalledFunction();
4585 if (!F)
4586 return false;
4587
4588 LibFunc Func;
4589 if (!TLI || !TLI->getLibFunc(*F, Func))
4590 return false;
4591
4592 if (Call->arg_size() == 1) {
4593 if (ConstantFP *OpC = dyn_cast<ConstantFP>(Call->getArgOperand(0))) {
4594 const APFloat &Op = OpC->getValueAPF();
4595 switch (Func) {
4596 case LibFunc_logl:
4597 case LibFunc_log:
4598 case LibFunc_logf:
4599 case LibFunc_log2l:
4600 case LibFunc_log2:
4601 case LibFunc_log2f:
4602 case LibFunc_log10l:
4603 case LibFunc_log10:
4604 case LibFunc_log10f:
4605 return Op.isNaN() || (!Op.isZero() && !Op.isNegative());
4606
4607 case LibFunc_ilogb:
4608 return !Op.isNaN() && !Op.isZero() && !Op.isInfinity();
4609
4610 case LibFunc_expl:
4611 case LibFunc_exp:
4612 case LibFunc_expf:
4613 // FIXME: These boundaries are slightly conservative.
4614 if (OpC->getType()->isDoubleTy())
4615 return !(Op < APFloat(-745.0) || Op > APFloat(709.0));
4616 if (OpC->getType()->isFloatTy())
4617 return !(Op < APFloat(-103.0f) || Op > APFloat(88.0f));
4618 break;
4619
4620 case LibFunc_exp2l:
4621 case LibFunc_exp2:
4622 case LibFunc_exp2f:
4623 // FIXME: These boundaries are slightly conservative.
4624 if (OpC->getType()->isDoubleTy())
4625 return !(Op < APFloat(-1074.0) || Op > APFloat(1023.0));
4626 if (OpC->getType()->isFloatTy())
4627 return !(Op < APFloat(-149.0f) || Op > APFloat(127.0f));
4628 break;
4629
4630 case LibFunc_sinl:
4631 case LibFunc_sin:
4632 case LibFunc_sinf:
4633 case LibFunc_cosl:
4634 case LibFunc_cos:
4635 case LibFunc_cosf:
4636 return !Op.isInfinity();
4637
4638 case LibFunc_tanl:
4639 case LibFunc_tan:
4640 case LibFunc_tanf: {
4641 // FIXME: Stop using the host math library.
4642 // FIXME: The computation isn't done in the right precision.
4643 Type *Ty = OpC->getType();
4644 if (Ty->isDoubleTy() || Ty->isFloatTy() || Ty->isHalfTy())
4645 return ConstantFoldFP(tan, OpC->getValueAPF(), Ty) != nullptr;
4646 break;
4647 }
4648
4649 case LibFunc_atan:
4650 case LibFunc_atanf:
4651 case LibFunc_atanl:
4652 // Per POSIX, this MAY fail if Op is denormal. We choose not failing.
4653 return true;
4654
4655 case LibFunc_asinl:
4656 case LibFunc_asin:
4657 case LibFunc_asinf:
4658 case LibFunc_acosl:
4659 case LibFunc_acos:
4660 case LibFunc_acosf:
4661 return !(Op < APFloat::getOne(Op.getSemantics(), true) ||
4662 Op > APFloat::getOne(Op.getSemantics()));
4663
4664 case LibFunc_sinh:
4665 case LibFunc_cosh:
4666 case LibFunc_sinhf:
4667 case LibFunc_coshf:
4668 case LibFunc_sinhl:
4669 case LibFunc_coshl:
4670 // FIXME: These boundaries are slightly conservative.
4671 if (OpC->getType()->isDoubleTy())
4672 return !(Op < APFloat(-710.0) || Op > APFloat(710.0));
4673 if (OpC->getType()->isFloatTy())
4674 return !(Op < APFloat(-89.0f) || Op > APFloat(89.0f));
4675 break;
4676
4677 case LibFunc_sqrtl:
4678 case LibFunc_sqrt:
4679 case LibFunc_sqrtf:
4680 return Op.isNaN() || Op.isZero() || !Op.isNegative();
4681
4682 // FIXME: Add more functions: sqrt_finite, atanh, expm1, log1p,
4683 // maybe others?
4684 default:
4685 break;
4686 }
4687 }
4688 }
4689
4690 if (Call->arg_size() == 2) {
4691 ConstantFP *Op0C = dyn_cast<ConstantFP>(Call->getArgOperand(0));
4692 ConstantFP *Op1C = dyn_cast<ConstantFP>(Call->getArgOperand(1));
4693 if (Op0C && Op1C) {
4694 const APFloat &Op0 = Op0C->getValueAPF();
4695 const APFloat &Op1 = Op1C->getValueAPF();
4696
4697 switch (Func) {
4698 case LibFunc_powl:
4699 case LibFunc_pow:
4700 case LibFunc_powf: {
4701 // FIXME: Stop using the host math library.
4702 // FIXME: The computation isn't done in the right precision.
4703 Type *Ty = Op0C->getType();
4704 if (Ty->isDoubleTy() || Ty->isFloatTy() || Ty->isHalfTy()) {
4705 if (Ty == Op1C->getType())
4706 return ConstantFoldBinaryFP(pow, Op0, Op1, Ty) != nullptr;
4707 }
4708 break;
4709 }
4710
4711 case LibFunc_fmodl:
4712 case LibFunc_fmod:
4713 case LibFunc_fmodf:
4714 case LibFunc_remainderl:
4715 case LibFunc_remainder:
4716 case LibFunc_remainderf:
4717 return Op0.isNaN() || Op1.isNaN() ||
4718 (!Op0.isInfinity() && !Op1.isZero());
4719
4720 case LibFunc_atan2:
4721 case LibFunc_atan2f:
4722 case LibFunc_atan2l:
4723 // Although IEEE-754 says atan2(+/-0.0, +/-0.0) are well-defined, and
4724 // GLIBC and MSVC do not appear to raise an error on those, we
4725 // cannot rely on that behavior. POSIX and C11 say that a domain error
4726 // may occur, so allow for that possibility.
4727 return !Op0.isZero() || !Op1.isZero();
4728
4729 default:
4730 break;
4731 }
4732 }
4733 }
4734
4735 return false;
4736}
4737
4739 unsigned CastOp, const DataLayout &DL,
4740 PreservedCastFlags *Flags) {
4741 switch (CastOp) {
4742 case Instruction::BitCast:
4743 // Bitcast is always lossless.
4744 return ConstantFoldCastOperand(Instruction::BitCast, C, InvCastTo, DL);
4745 case Instruction::Trunc: {
4746 auto *ZExtC = ConstantFoldCastOperand(Instruction::ZExt, C, InvCastTo, DL);
4747 if (Flags) {
4748 // Truncation back on ZExt value is always NUW.
4749 Flags->NUW = true;
4750 // Test positivity of C.
4751 auto *SExtC =
4752 ConstantFoldCastOperand(Instruction::SExt, C, InvCastTo, DL);
4753 Flags->NSW = ZExtC == SExtC;
4754 }
4755 return ZExtC;
4756 }
4757 case Instruction::SExt:
4758 case Instruction::ZExt: {
4759 auto *InvC = ConstantExpr::getTrunc(C, InvCastTo);
4760 auto *CastInvC = ConstantFoldCastOperand(CastOp, InvC, C->getType(), DL);
4761 // Must satisfy CastOp(InvC) == C.
4762 if (!CastInvC || CastInvC != C)
4763 return nullptr;
4764 if (Flags && CastOp == Instruction::ZExt) {
4765 auto *SExtInvC =
4766 ConstantFoldCastOperand(Instruction::SExt, InvC, C->getType(), DL);
4767 // Test positivity of InvC.
4768 Flags->NNeg = CastInvC == SExtInvC;
4769 }
4770 return InvC;
4771 }
4772 case Instruction::FPExt: {
4773 Constant *InvC =
4774 ConstantFoldCastOperand(Instruction::FPTrunc, C, InvCastTo, DL);
4775 if (InvC) {
4776 Constant *CastInvC =
4777 ConstantFoldCastOperand(CastOp, InvC, C->getType(), DL);
4778 if (CastInvC == C)
4779 return InvC;
4780 }
4781 return nullptr;
4782 }
4783 default:
4784 return nullptr;
4785 }
4786}
4787
4789 const DataLayout &DL,
4790 PreservedCastFlags *Flags) {
4791 return getLosslessInvCast(C, DestTy, Instruction::ZExt, DL, Flags);
4792}
4793
4795 const DataLayout &DL,
4796 PreservedCastFlags *Flags) {
4797 return getLosslessInvCast(C, DestTy, Instruction::SExt, DL, Flags);
4798}
4799
4800void TargetFolder::anchor() {}
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
constexpr LLT S1
This file declares a class to represent arbitrary precision floating point values and provide a varie...
This file implements a class to represent arbitrary precision integral constant values and operations...
This file implements the APSInt class, which is a simple class that represents an arbitrary sized int...
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
Function Alias Analysis Results
#define X(NUM, ENUM, NAME)
Definition ELF.h:849
static GCRegistry::Add< ErlangGC > A("erlang", "erlang-compatible garbage collector")
static GCRegistry::Add< CoreCLRGC > E("coreclr", "CoreCLR-compatible GC")
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")
static Constant * FoldBitCast(Constant *V, Type *DestTy)
static ConstantFP * flushDenormalConstant(Type *Ty, const APFloat &APF, DenormalMode::DenormalModeKind Mode)
Constant * getConstantAtOffset(Constant *Base, APInt Offset, const DataLayout &DL)
If this Offset points exactly to the start of an aggregate element, return that element,...
static cl::opt< bool > DisableFPCallFolding("disable-fp-call-folding", cl::desc("Disable constant-folding of FP intrinsics and libcalls."), cl::init(false), cl::Hidden)
static ConstantFP * flushDenormalConstantFP(ConstantFP *CFP, const Instruction *Inst, bool IsOutput)
static DenormalMode getInstrDenormalMode(const Instruction *CtxI, Type *Ty)
Return the denormal mode that can be assumed when executing a floating point operation at CtxI.
This file contains the declarations for the subclasses of Constant, which represent the different fla...
This file defines the DenseMap class.
Hexagon Common GEP
amode Optimize addressing mode
const AbstractManglingParser< Derived, Alloc >::OperatorInfo AbstractManglingParser< Derived, Alloc >::Ops[]
#define F(x, y, z)
Definition MD5.cpp:54
#define I(x, y, z)
Definition MD5.cpp:57
static bool InRange(int64_t Value, unsigned short Shift, int LBound, int HBound)
This file contains the definitions of the enumerations and flags associated with NVVM Intrinsics,...
if(PassOpts->AAPipeline)
const SmallVectorImpl< MachineOperand > & Cond
static cl::opt< RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode > Mode("regalloc-enable-advisor", cl::Hidden, cl::init(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Default), cl::desc("Enable regalloc advisor mode"), cl::values(clEnumValN(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Default, "default", "Default"), clEnumValN(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Release, "release", "precompiled"), clEnumValN(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Development, "development", "for training")))
This file contains some templates that are useful if you are working with the STL at all.
This file defines the SmallVector class.
static SymbolRef::Type getType(const Symbol *Sym)
Definition TapiFile.cpp:39
The Input class is used to parse a yaml document into in-memory structs and vectors.
static constexpr roundingMode rmTowardZero
Definition APFloat.h:348
llvm::RoundingMode roundingMode
IEEE-754R 4.3: Rounding-direction attributes.
Definition APFloat.h:342
static const fltSemantics & IEEEdouble()
Definition APFloat.h:297
static constexpr roundingMode rmTowardNegative
Definition APFloat.h:347
static constexpr roundingMode rmNearestTiesToEven
Definition APFloat.h:344
static constexpr roundingMode rmTowardPositive
Definition APFloat.h:346
static const fltSemantics & IEEEhalf()
Definition APFloat.h:294
static constexpr roundingMode rmNearestTiesToAway
Definition APFloat.h:349
opStatus
IEEE-754R 7: Default exception handling.
Definition APFloat.h:360
static APFloat getQNaN(const fltSemantics &Sem, bool Negative=false, const APInt *payload=nullptr)
Factory for QNaN values.
Definition APFloat.h:1175
opStatus divide(const APFloat &RHS, roundingMode RM)
Definition APFloat.h:1263
void copySign(const APFloat &RHS)
Definition APFloat.h:1357
LLVM_ABI opStatus convert(const fltSemantics &ToSemantics, roundingMode RM, bool *losesInfo)
Definition APFloat.cpp:5890
opStatus subtract(const APFloat &RHS, roundingMode RM)
Definition APFloat.h:1245
bool isNegative() const
Definition APFloat.h:1516
LLVM_ABI double convertToDouble() const
Converts this APFloat to host double value.
Definition APFloat.cpp:5949
bool isPosInfinity() const
Definition APFloat.h:1529
bool isNormal() const
Definition APFloat.h:1520
bool isDenormal() const
Definition APFloat.h:1517
opStatus add(const APFloat &RHS, roundingMode RM)
Definition APFloat.h:1236
const fltSemantics & getSemantics() const
Definition APFloat.h:1524
bool isNonZero() const
Definition APFloat.h:1525
bool isFinite() const
Definition APFloat.h:1521
bool isNaN() const
Definition APFloat.h:1514
static APFloat getOne(const fltSemantics &Sem, bool Negative=false)
Factory for Positive and Negative One.
Definition APFloat.h:1143
opStatus multiply(const APFloat &RHS, roundingMode RM)
Definition APFloat.h:1254
LLVM_ABI float convertToFloat() const
Converts this APFloat to host float value.
Definition APFloat.cpp:5977
bool isSignaling() const
Definition APFloat.h:1518
opStatus fusedMultiplyAdd(const APFloat &Multiplicand, const APFloat &Addend, roundingMode RM)
Definition APFloat.h:1290
bool isZero() const
Definition APFloat.h:1512
opStatus convertToInteger(MutableArrayRef< integerPart > Input, unsigned int Width, bool IsSigned, roundingMode RM, bool *IsExact) const
Definition APFloat.h:1387
opStatus mod(const APFloat &RHS)
Definition APFloat.h:1281
bool isNegInfinity() const
Definition APFloat.h:1530
opStatus roundToIntegral(roundingMode RM)
Definition APFloat.h:1303
void changeSign()
Definition APFloat.h:1352
static APFloat getZero(const fltSemantics &Sem, bool Negative=false)
Factory for Positive and Negative Zero.
Definition APFloat.h:1134
bool isInfinity() const
Definition APFloat.h:1513
Class for arbitrary precision integers.
Definition APInt.h:78
LLVM_ABI APInt umul_ov(const APInt &RHS, bool &Overflow) const
Definition APInt.cpp:2011
LLVM_ABI APInt usub_sat(const APInt &RHS) const
Definition APInt.cpp:2095
bool isMinSignedValue() const
Determine if this is the smallest signed value.
Definition APInt.h:424
uint64_t getZExtValue() const
Get zero extended value.
Definition APInt.h:1555
LLVM_ABI uint64_t extractBitsAsZExtValue(unsigned numBits, unsigned bitPosition) const
Definition APInt.cpp:520
LLVM_ABI APInt zextOrTrunc(unsigned width) const
Zero extend or truncate to width.
Definition APInt.cpp:1064
LLVM_ABI APInt trunc(unsigned width) const
Truncate to new width.
Definition APInt.cpp:956
static APInt getMaxValue(unsigned numBits)
Gets maximum unsigned value of APInt for specific bit width.
Definition APInt.h:207
APInt abs() const
Get the absolute value.
Definition APInt.h:1810
LLVM_ABI APInt sadd_sat(const APInt &RHS) const
Definition APInt.cpp:2066
bool sgt(const APInt &RHS) const
Signed greater than comparison.
Definition APInt.h:1208
LLVM_ABI APInt usub_ov(const APInt &RHS, bool &Overflow) const
Definition APInt.cpp:1988
bool ugt(const APInt &RHS) const
Unsigned greater than comparison.
Definition APInt.h:1189
bool isZero() const
Determine if this value is zero, i.e. all bits are clear.
Definition APInt.h:381
LLVM_ABI APInt urem(const APInt &RHS) const
Unsigned remainder operation.
Definition APInt.cpp:1697
unsigned getBitWidth() const
Return the number of bits in the APInt.
Definition APInt.h:1503
bool ult(const APInt &RHS) const
Unsigned less than comparison.
Definition APInt.h:1118
static APInt getSignedMaxValue(unsigned numBits)
Gets maximum signed value of APInt for a specific bit width.
Definition APInt.h:210
LLVM_ABI APInt sadd_ov(const APInt &RHS, bool &Overflow) const
Definition APInt.cpp:1968
LLVM_ABI APInt uadd_ov(const APInt &RHS, bool &Overflow) const
Definition APInt.cpp:1975
unsigned countr_zero() const
Count the number of trailing zero bits.
Definition APInt.h:1654
unsigned countl_zero() const
The APInt version of std::countl_zero.
Definition APInt.h:1613
static APInt getSignedMinValue(unsigned numBits)
Gets minimum signed value of APInt for a specific bit width.
Definition APInt.h:220
LLVM_ABI APInt sextOrTrunc(unsigned width) const
Sign extend or truncate to width.
Definition APInt.cpp:1072
LLVM_ABI APInt uadd_sat(const APInt &RHS) const
Definition APInt.cpp:2076
APInt ashr(unsigned ShiftAmt) const
Arithmetic right-shift function.
Definition APInt.h:834
LLVM_ABI APInt smul_ov(const APInt &RHS, bool &Overflow) const
Definition APInt.cpp:2000
LLVM_ABI APInt sext(unsigned width) const
Sign extend to a new width.
Definition APInt.cpp:1016
APInt shl(unsigned shiftAmt) const
Left-shift function.
Definition APInt.h:880
bool slt(const APInt &RHS) const
Signed less than comparison.
Definition APInt.h:1137
LLVM_ABI APInt extractBits(unsigned numBits, unsigned bitPosition) const
Return an APInt with the extracted bits [bitPosition,bitPosition+numBits).
Definition APInt.cpp:482
LLVM_ABI APInt ssub_ov(const APInt &RHS, bool &Overflow) const
Definition APInt.cpp:1981
bool isOne() const
Determine if this is a value of 1.
Definition APInt.h:390
APInt lshr(unsigned shiftAmt) const
Logical right-shift function.
Definition APInt.h:858
LLVM_ABI APInt ssub_sat(const APInt &RHS) const
Definition APInt.cpp:2085
An arbitrary precision integer that knows its signedness.
Definition APSInt.h:24
This class represents an incoming formal argument to a Function.
Definition Argument.h:32
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition ArrayRef.h:40
size_t size() const
size - Get the array size.
Definition ArrayRef.h:142
Base class for all callable instructions (InvokeInst and CallInst) Holds everything related to callin...
static LLVM_ABI Instruction::CastOps getCastOpcode(const Value *Val, bool SrcIsSigned, Type *Ty, bool DstIsSigned)
Returns the opcode necessary to cast Val into Ty using usual casting rules.
static LLVM_ABI unsigned isEliminableCastPair(Instruction::CastOps firstOpcode, Instruction::CastOps secondOpcode, Type *SrcTy, Type *MidTy, Type *DstTy, const DataLayout *DL)
Determine how a pair of casts can be eliminated, if they can be at all.
static LLVM_ABI bool castIsValid(Instruction::CastOps op, Type *SrcTy, Type *DstTy)
This method can be used to determine if a cast from SrcTy to DstTy using Opcode op is valid or not.
Predicate
This enumeration lists the possible predicates for CmpInst subclasses.
Definition InstrTypes.h:676
bool isSigned() const
Definition InstrTypes.h:930
Predicate getSwappedPredicate() const
For example, EQ->EQ, SLE->SGE, ULT->UGT, OEQ->OEQ, ULE->UGE, OLT->OGT, etc.
Definition InstrTypes.h:827
static bool isFPPredicate(Predicate P)
Definition InstrTypes.h:770
static Constant * get(LLVMContext &Context, ArrayRef< ElementTy > Elts)
get() constructor - Return a constant with array type with an element count and element type matching...
Definition Constants.h:859
static LLVM_ABI Constant * getIntToPtr(Constant *C, Type *Ty, bool OnlyIfReduced=false)
static LLVM_ABI Constant * getExtractElement(Constant *Vec, Constant *Idx, Type *OnlyIfReducedTy=nullptr)
static LLVM_ABI bool isDesirableCastOp(unsigned Opcode)
Whether creating a constant expression for this cast is desirable.
static LLVM_ABI Constant * getCast(unsigned ops, Constant *C, Type *Ty, bool OnlyIfReduced=false)
Convenience function for getting a Cast operation.
static LLVM_ABI Constant * getSub(Constant *C1, Constant *C2, bool HasNUW=false, bool HasNSW=false)
static Constant * getPtrAdd(Constant *Ptr, Constant *Offset, GEPNoWrapFlags NW=GEPNoWrapFlags::none(), std::optional< ConstantRange > InRange=std::nullopt, Type *OnlyIfReduced=nullptr)
Create a getelementptr i8, ptr, offset constant expression.
Definition Constants.h:1472
static LLVM_ABI Constant * getInsertElement(Constant *Vec, Constant *Elt, Constant *Idx, Type *OnlyIfReducedTy=nullptr)
static LLVM_ABI Constant * getShuffleVector(Constant *V1, Constant *V2, ArrayRef< int > Mask, Type *OnlyIfReducedTy=nullptr)
static bool isSupportedGetElementPtr(const Type *SrcElemTy)
Whether creating a constant expression for this getelementptr type is supported.
Definition Constants.h:1573
static LLVM_ABI Constant * get(unsigned Opcode, Constant *C1, Constant *C2, unsigned Flags=0, Type *OnlyIfReducedTy=nullptr)
get - Return a binary or shift operator constant expression, folding if possible.
static LLVM_ABI bool isDesirableBinOp(unsigned Opcode)
Whether creating a constant expression for this binary operator is desirable.
static Constant * getGetElementPtr(Type *Ty, Constant *C, ArrayRef< Constant * > IdxList, GEPNoWrapFlags NW=GEPNoWrapFlags::none(), std::optional< ConstantRange > InRange=std::nullopt, Type *OnlyIfReducedTy=nullptr)
Getelementptr form.
Definition Constants.h:1445
static LLVM_ABI Constant * getBitCast(Constant *C, Type *Ty, bool OnlyIfReduced=false)
static LLVM_ABI Constant * getTrunc(Constant *C, Type *Ty, bool OnlyIfReduced=false)
ConstantFP - Floating Point Values [float, double].
Definition Constants.h:420
const APFloat & getValueAPF() const
Definition Constants.h:463
static LLVM_ABI Constant * getInfinity(Type *Ty, bool Negative=false)
static LLVM_ABI Constant * getZero(Type *Ty, bool Negative=false)
static LLVM_ABI Constant * getNaN(Type *Ty, bool Negative=false, uint64_t Payload=0)
This is the shared class of boolean and integer constants.
Definition Constants.h:87
static LLVM_ABI ConstantInt * getTrue(LLVMContext &Context)
static ConstantInt * getSigned(IntegerType *Ty, int64_t V, bool ImplicitTrunc=false)
Return a ConstantInt with the specified value for the specified type.
Definition Constants.h:135
static LLVM_ABI ConstantInt * getFalse(LLVMContext &Context)
int64_t getSExtValue() const
Return the constant as a 64-bit integer value after it has been sign extended as appropriate for the ...
Definition Constants.h:174
static LLVM_ABI ConstantInt * getBool(LLVMContext &Context, bool V)
static LLVM_ABI Constant * get(StructType *T, ArrayRef< Constant * > V)
static LLVM_ABI Constant * getSplat(ElementCount EC, Constant *Elt)
Return a ConstantVector with the specified constant in each element.
static LLVM_ABI Constant * get(ArrayRef< Constant * > V)
This is an important base class in LLVM.
Definition Constant.h:43
LLVM_ABI Constant * getSplatValue(bool AllowPoison=false) const
If all elements of the vector constant have the same value, return that value.
static LLVM_ABI Constant * getAllOnesValue(Type *Ty)
static LLVM_ABI Constant * getNullValue(Type *Ty)
Constructor to create a '0' constant of arbitrary type.
LLVM_ABI Constant * getAggregateElement(unsigned Elt) const
For aggregates (struct/array/vector) return the constant that corresponds to the specified element if...
LLVM_ABI bool isNullValue() const
Return true if this is the value that would be returned by getNullValue.
Definition Constants.cpp:74
Constrained floating point compare intrinsics.
This is the common base class for constrained floating point intrinsics.
LLVM_ABI std::optional< fp::ExceptionBehavior > getExceptionBehavior() const
LLVM_ABI std::optional< RoundingMode > getRoundingMode() const
Wrapper for a function that represents a value that functionally represents the original function.
Definition Constants.h:1118
A parsed version of the target data layout string in and methods for querying it.
Definition DataLayout.h:64
iterator find(const_arg_type_t< KeyT > Val)
Definition DenseMap.h:178
iterator end()
Definition DenseMap.h:81
std::pair< iterator, bool > insert(const std::pair< KeyT, ValueT > &KV)
Definition DenseMap.h:241
static LLVM_ABI bool compare(const APFloat &LHS, const APFloat &RHS, FCmpInst::Predicate Pred)
Return result of LHS Pred RHS comparison.
This provides a helper for copying FMF from an instruction or setting specified flags.
Definition IRBuilder.h:93
Class to represent fixed width SIMD vectors.
unsigned getNumElements() const
static LLVM_ABI FixedVectorType * get(Type *ElementType, unsigned NumElts)
Definition Type.cpp:873
DenormalMode getDenormalMode(const fltSemantics &FPType) const
Returns the denormal handling type for the default rounding mode of the function.
Definition Function.cpp:804
Represents flags for the getelementptr instruction/expression.
static GEPNoWrapFlags inBounds()
GEPNoWrapFlags withoutNoUnsignedSignedWrap() const
static GEPNoWrapFlags noUnsignedWrap()
bool hasNoUnsignedSignedWrap() const
bool isInBounds() const
static LLVM_ABI Type * getIndexedType(Type *Ty, ArrayRef< Value * > IdxList)
Returns the result type of a getelementptr with the given source element type and indexes.
PointerType * getType() const
Global values are always pointers.
LLVM_ABI const DataLayout & getDataLayout() const
Get the data layout of the module this global belongs to.
Definition Globals.cpp:135
const Constant * getInitializer() const
getInitializer - Return the initializer for this global variable.
bool isConstant() const
If the value is a global constant, its value is immutable throughout the runtime execution of the pro...
bool hasDefinitiveInitializer() const
hasDefinitiveInitializer - Whether the global variable has an initializer, and any other instances of...
static LLVM_ABI bool compare(const APInt &LHS, const APInt &RHS, ICmpInst::Predicate Pred)
Return result of LHS Pred RHS comparison.
Predicate getSignedPredicate() const
For example, EQ->EQ, SLE->SLE, UGT->SGT, etc.
bool isEquality() const
Return true if this predicate is either EQ or NE.
bool isCast() const
bool isBinaryOp() const
LLVM_ABI const Function * getFunction() const
Return the function this instruction belongs to.
bool isUnaryOp() const
static LLVM_ABI IntegerType * get(LLVMContext &C, unsigned NumBits)
This static method is the primary way of constructing an IntegerType.
Definition Type.cpp:354
This is an important class for using LLVM in a threaded context.
Definition LLVMContext.h:68
static APInt getSaturationPoint(Intrinsic::ID ID, unsigned numBits)
Min/max intrinsics are monotonic, they operate on a fixed-bitwidth values, so there is a certain thre...
static ICmpInst::Predicate getPredicate(Intrinsic::ID ID)
Returns the comparison predicate underlying the intrinsic.
static LLVM_ABI PoisonValue * get(Type *T)
Static factory methods - Return an 'poison' object of the specified type.
Class to represent scalable SIMD vectors.
void push_back(const T &Elt)
pointer data()
Return a pointer to the vector's buffer, even if empty().
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
StringRef - Represent a constant reference to a string, i.e.
Definition StringRef.h:55
Used to lazily calculate structure layout information for a target machine, based on the DataLayout s...
Definition DataLayout.h:736
LLVM_ABI unsigned getElementContainingOffset(uint64_t FixedOffset) const
Given a valid byte offset into the structure, returns the structure index that contains it.
TypeSize getElementOffset(unsigned Idx) const
Definition DataLayout.h:767
Class to represent struct types.
unsigned getNumElements() const
Random access to the elements.
Provides information about what library functions are available for the current target.
bool has(LibFunc F) const
Tests whether a library function is available.
bool getLibFunc(StringRef funcName, LibFunc &F) const
Searches for a particular function name.
The instances of the Type class are immutable: once they are created, they are never changed.
Definition Type.h:46
static LLVM_ABI IntegerType * getInt64Ty(LLVMContext &C)
Definition Type.cpp:314
bool isVectorTy() const
True if this is an instance of VectorType.
Definition Type.h:290
static LLVM_ABI IntegerType * getInt32Ty(LLVMContext &C)
Definition Type.cpp:313
bool isPointerTy() const
True if this is an instance of PointerType.
Definition Type.h:284
LLVM_ABI unsigned getPointerAddressSpace() const
Get the address space of this pointer or pointer vector type.
@ HalfTyID
16-bit floating point type
Definition Type.h:57
@ FloatTyID
32-bit floating point type
Definition Type.h:59
@ DoubleTyID
64-bit floating point type
Definition Type.h:60
Type * getScalarType() const
If this is a vector type, return the element type, otherwise return 'this'.
Definition Type.h:370
LLVM_ABI TypeSize getPrimitiveSizeInBits() const LLVM_READONLY
Return the basic size of this type if it is a primitive type.
Definition Type.cpp:201
static LLVM_ABI IntegerType * getInt16Ty(LLVMContext &C)
Definition Type.cpp:312
bool isSized(SmallPtrSetImpl< Type * > *Visited=nullptr) const
Return true if it makes sense to take the size of this type.
Definition Type.h:328
LLVMContext & getContext() const
Return the LLVMContext in which this type was uniqued.
Definition Type.h:130
LLVM_ABI unsigned getScalarSizeInBits() const LLVM_READONLY
If this is a vector type, return the getPrimitiveSizeInBits value for the element type.
Definition Type.cpp:236
static LLVM_ABI IntegerType * getInt1Ty(LLVMContext &C)
Definition Type.cpp:310
bool isFloatingPointTy() const
Return true if this is one of the floating-point types.
Definition Type.h:186
bool isPtrOrPtrVectorTy() const
Return true if this is a pointer type or a vector of pointer types.
Definition Type.h:287
bool isX86_AMXTy() const
Return true if this is X86 AMX.
Definition Type.h:202
bool isIntegerTy() const
True if this is an instance of IntegerType.
Definition Type.h:257
static LLVM_ABI IntegerType * getIntNTy(LLVMContext &C, unsigned N)
Definition Type.cpp:317
Type * getContainedType(unsigned i) const
This method is used to implement the type iterator (defined at the end of the file).
Definition Type.h:399
LLVM_ABI const fltSemantics & getFltSemantics() const
Definition Type.cpp:110
static LLVM_ABI UndefValue * get(Type *T)
Static factory methods - Return an 'undef' object of the specified type.
A Use represents the edge between a Value definition and its users.
Definition Use.h:35
LLVM Value Representation.
Definition Value.h:75
Type * getType() const
All values are typed, get the type of this value.
Definition Value.h:256
LLVMContext & getContext() const
All values hold a context through their type.
Definition Value.h:259
LLVM_ABI const Value * stripAndAccumulateConstantOffsets(const DataLayout &DL, APInt &Offset, bool AllowNonInbounds, bool AllowInvariantGroup=false, function_ref< bool(Value &Value, APInt &Offset)> ExternalAnalysis=nullptr, bool LookThroughIntToPtr=false) const
Accumulate the constant offset this value has compared to a base pointer.
LLVM_ABI uint64_t getPointerDereferenceableBytes(const DataLayout &DL, bool &CanBeNull, bool &CanBeFreed) const
Returns the number of bytes known to be dereferenceable for the pointer value.
Definition Value.cpp:893
Base class of all SIMD vector types.
ElementCount getElementCount() const
Return an ElementCount instance to represent the (possibly scalable) number of elements in the vector...
Type * getElementType() const
constexpr ScalarTy getFixedValue() const
Definition TypeSize.h:200
constexpr bool isScalable() const
Returns whether the quantity is scaled by a runtime quantity (vscale).
Definition TypeSize.h:168
constexpr bool isFixed() const
Returns true if the quantity is not scaled by vscale.
Definition TypeSize.h:171
constexpr LeafTy divideCoefficientBy(ScalarTy RHS) const
We do not provide the '/' operator here because division for polynomial types does not work in the sa...
Definition TypeSize.h:252
static constexpr bool isKnownGE(const FixedOrScalableQuantity &LHS, const FixedOrScalableQuantity &RHS)
Definition TypeSize.h:237
const ParentTy * getParent() const
Definition ilist_node.h:34
CallInst * Call
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
const APInt & smin(const APInt &A, const APInt &B)
Determine the smaller of two APInts considered to be signed.
Definition APInt.h:2266
const APInt & smax(const APInt &A, const APInt &B)
Determine the larger of two APInts considered to be signed.
Definition APInt.h:2271
const APInt & umin(const APInt &A, const APInt &B)
Determine the smaller of two APInts considered to be unsigned.
Definition APInt.h:2276
const APInt & umax(const APInt &A, const APInt &B)
Determine the larger of two APInts considered to be unsigned.
Definition APInt.h:2281
constexpr std::underlying_type_t< E > Mask()
Get a bitmask with 1s in all places up to the high-order bit of E's largest value.
unsigned ID
LLVM IR allows to use arbitrary numbers as calling convention identifiers.
Definition CallingConv.h:24
@ C
The default llvm calling convention, compatible with C.
Definition CallingConv.h:34
@ CE
Windows NT (Windows on ARM)
Definition MCAsmInfo.h:48
initializer< Ty > init(const Ty &Val)
@ ebStrict
This corresponds to "fpexcept.strict".
Definition FPEnv.h:42
@ ebIgnore
This corresponds to "fpexcept.ignore".
Definition FPEnv.h:40
constexpr double pi
APFloat::roundingMode GetFMARoundingMode(Intrinsic::ID IntrinsicID)
DenormalMode GetNVVMDenormMode(bool ShouldFTZ)
bool FPToIntegerIntrinsicNaNZero(Intrinsic::ID IntrinsicID)
APFloat::roundingMode GetFDivRoundingMode(Intrinsic::ID IntrinsicID)
bool FPToIntegerIntrinsicResultIsSigned(Intrinsic::ID IntrinsicID)
APFloat::roundingMode GetFPToIntegerRoundingMode(Intrinsic::ID IntrinsicID)
bool RCPShouldFTZ(Intrinsic::ID IntrinsicID)
bool FPToIntegerIntrinsicShouldFTZ(Intrinsic::ID IntrinsicID)
bool FDivShouldFTZ(Intrinsic::ID IntrinsicID)
bool FAddShouldFTZ(Intrinsic::ID IntrinsicID)
bool FMinFMaxIsXorSignAbs(Intrinsic::ID IntrinsicID)
APFloat::roundingMode GetFMulRoundingMode(Intrinsic::ID IntrinsicID)
bool UnaryMathIntrinsicShouldFTZ(Intrinsic::ID IntrinsicID)
bool FMinFMaxShouldFTZ(Intrinsic::ID IntrinsicID)
APFloat::roundingMode GetFAddRoundingMode(Intrinsic::ID IntrinsicID)
bool FMAShouldFTZ(Intrinsic::ID IntrinsicID)
bool FMulShouldFTZ(Intrinsic::ID IntrinsicID)
APFloat::roundingMode GetRCPRoundingMode(Intrinsic::ID IntrinsicID)
bool FMinFMaxPropagatesNaNs(Intrinsic::ID IntrinsicID)
NodeAddr< FuncNode * > Func
Definition RDFGraph.h:393
LLVM_ABI std::error_code status(const Twine &path, file_status &result, bool follow=true)
Get file status as if by POSIX stat().
This is an optimization pass for GlobalISel generic memory operations.
auto drop_begin(T &&RangeOrContainer, size_t N=1)
Return a range covering RangeOrContainer with the first N elements excluded.
Definition STLExtras.h:316
@ Offset
Definition DWP.cpp:532
LLVM_ABI Constant * ConstantFoldBinaryIntrinsic(Intrinsic::ID ID, Constant *LHS, Constant *RHS, Type *Ty, Instruction *FMFSource)
bool all_of(R &&range, UnaryPredicate P)
Provide wrappers to std::all_of which take ranges instead of having to pass begin/end explicitly.
Definition STLExtras.h:1739
LLVM_ABI Constant * ConstantFoldLoadThroughBitcast(Constant *C, Type *DestTy, const DataLayout &DL)
ConstantFoldLoadThroughBitcast - try to cast constant to destination type returning null if unsuccess...
static double log2(double V)
LLVM_ABI Constant * ConstantFoldSelectInstruction(Constant *Cond, Constant *V1, Constant *V2)
Attempt to constant fold a select instruction with the specified operands.
LLVM_ABI Constant * ConstantFoldFPInstOperands(unsigned Opcode, Constant *LHS, Constant *RHS, const DataLayout &DL, const Instruction *I, bool AllowNonDeterministic=true)
Attempt to constant fold a floating point binary operation with the specified operands,...
auto enumerate(FirstRange &&First, RestRanges &&...Rest)
Given two or more input ranges, returns a new range whose values are tuples (A, B,...
Definition STLExtras.h:2554
LLVM_ABI bool canConstantFoldCallTo(const CallBase *Call, const Function *F)
canConstantFoldCallTo - Return true if its even possible to fold a call to the specified function.
unsigned getPointerAddressSpace(const Type *T)
Definition SPIRVUtils.h:374
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:643
LLVM_ABI Constant * ConstantFoldInstruction(const Instruction *I, const DataLayout &DL, const TargetLibraryInfo *TLI=nullptr)
ConstantFoldInstruction - Try to constant fold the specified instruction.
APFloat abs(APFloat X)
Returns the absolute value of the argument.
Definition APFloat.h:1630
LLVM_ABI Constant * ConstantFoldCompareInstruction(CmpInst::Predicate Predicate, Constant *C1, Constant *C2)
LLVM_ABI Constant * ConstantFoldUnaryInstruction(unsigned Opcode, Constant *V)
LLVM_ABI bool IsConstantOffsetFromGlobal(Constant *C, GlobalValue *&GV, APInt &Offset, const DataLayout &DL, DSOLocalEquivalent **DSOEquiv=nullptr)
If this constant is a constant offset from a global, return the global and the constant.
LLVM_ABI bool isMathLibCallNoop(const CallBase *Call, const TargetLibraryInfo *TLI)
Check whether the given call has no side-effects.
LLVM_ABI Constant * ReadByteArrayFromGlobal(const GlobalVariable *GV, uint64_t Offset)
auto dyn_cast_if_present(const Y &Val)
dyn_cast_if_present<X> - Functionally identical to dyn_cast, except that a null (or none in the case ...
Definition Casting.h:732
LLVM_READONLY APFloat maximum(const APFloat &A, const APFloat &B)
Implements IEEE 754-2019 maximum semantics.
Definition APFloat.h:1710
LLVM_ABI Constant * ConstantFoldCompareInstOperands(unsigned Predicate, Constant *LHS, Constant *RHS, const DataLayout &DL, const TargetLibraryInfo *TLI=nullptr, const Instruction *I=nullptr)
Attempt to constant fold a compare instruction (icmp/fcmp) with the specified operands.
int ilogb(const APFloat &Arg)
Returns the exponent of the internal representation of the APFloat.
Definition APFloat.h:1601
bool isa_and_nonnull(const Y &Val)
Definition Casting.h:676
LLVM_ABI Constant * ConstantFoldCall(const CallBase *Call, Function *F, ArrayRef< Constant * > Operands, const TargetLibraryInfo *TLI=nullptr, bool AllowNonDeterministic=true)
ConstantFoldCall - Attempt to constant fold a call to the specified function with the specified argum...
APFloat frexp(const APFloat &X, int &Exp, APFloat::roundingMode RM)
Equivalent of C standard library function.
Definition APFloat.h:1622
LLVM_ABI Constant * ConstantFoldExtractValueInstruction(Constant *Agg, ArrayRef< unsigned > Idxs)
Attempt to constant fold an extractvalue instruction with the specified operands and indices.
LLVM_ABI Constant * ConstantFoldConstant(const Constant *C, const DataLayout &DL, const TargetLibraryInfo *TLI=nullptr)
ConstantFoldConstant - Fold the constant using the specified DataLayout.
auto dyn_cast_or_null(const Y &Val)
Definition Casting.h:753
bool any_of(R &&range, UnaryPredicate P)
Provide wrappers to std::any_of which take ranges instead of having to pass begin/end explicitly.
Definition STLExtras.h:1746
LLVM_READONLY APFloat maxnum(const APFloat &A, const APFloat &B)
Implements IEEE-754 2008 maxNum semantics.
Definition APFloat.h:1665
LLVM_ABI Constant * ConstantFoldLoadFromUniformValue(Constant *C, Type *Ty, const DataLayout &DL)
If C is a uniform value where all bits are the same (either all zero, all ones, all undef or all pois...
LLVM_ABI Constant * ConstantFoldUnaryOpOperand(unsigned Opcode, Constant *Op, const DataLayout &DL)
Attempt to constant fold a unary operation with the specified operand.
LLVM_ABI Constant * FlushFPConstant(Constant *Operand, const Instruction *I, bool IsOutput)
Attempt to flush float point constant according to denormal mode set in the instruction's parent func...
LLVM_ABI Constant * getLosslessUnsignedTrunc(Constant *C, Type *DestTy, const DataLayout &DL, PreservedCastFlags *Flags=nullptr)
decltype(auto) get(const PointerIntPair< PointerTy, IntBits, IntType, PtrTraits, Info > &Pair)
LLVM_READONLY APFloat minimumnum(const APFloat &A, const APFloat &B)
Implements IEEE 754-2019 minimumNumber semantics.
Definition APFloat.h:1696
FPClassTest
Floating-point class tests, supported by 'is_fpclass' intrinsic.
APFloat scalbn(APFloat X, int Exp, APFloat::roundingMode RM)
Returns: X * 2^Exp for integral exponents.
Definition APFloat.h:1610
LLVM_ABI void computeKnownBits(const Value *V, KnownBits &Known, const DataLayout &DL, AssumptionCache *AC=nullptr, const Instruction *CxtI=nullptr, const DominatorTree *DT=nullptr, bool UseInstrInfo=true, unsigned Depth=0)
Determine which bits of V are known to be either zero or one and return them in the KnownZero/KnownOn...
LLVM_ABI bool NullPointerIsDefined(const Function *F, unsigned AS=0)
Check whether null pointer dereferencing is considered undefined behavior for a given function or an ...
LLVM_ABI Constant * getLosslessSignedTrunc(Constant *C, Type *DestTy, const DataLayout &DL, PreservedCastFlags *Flags=nullptr)
LLVM_ABI Constant * ConstantFoldCastOperand(unsigned Opcode, Constant *C, Type *DestTy, const DataLayout &DL)
Attempt to constant fold a cast with the specified operand.
LLVM_ABI Constant * ConstantFoldLoadFromConst(Constant *C, Type *Ty, const APInt &Offset, const DataLayout &DL)
Extract value of C at the given Offset reinterpreted as Ty.
bool isa(const From &Val)
isa<X> - Return true if the parameter to the template is an instance of one of the template type argu...
Definition Casting.h:547
LLVM_ABI bool intrinsicPropagatesPoison(Intrinsic::ID IID)
Return whether this intrinsic propagates poison for all operands.
LLVM_ABI Constant * ConstantFoldBinaryOpOperands(unsigned Opcode, Constant *LHS, Constant *RHS, const DataLayout &DL)
Attempt to constant fold a binary operation with the specified operands.
MutableArrayRef(T &OneElt) -> MutableArrayRef< T >
LLVM_READONLY APFloat minnum(const APFloat &A, const APFloat &B)
Implements IEEE-754 2008 minNum semantics.
Definition APFloat.h:1646
@ Sub
Subtraction of integers.
LLVM_ABI bool isVectorIntrinsicWithScalarOpAtArg(Intrinsic::ID ID, unsigned ScalarOpdIdx, const TargetTransformInfo *TTI)
Identifies if the vector form of the intrinsic has a scalar operand.
DWARFExpression::Operation Op
RoundingMode
Rounding mode.
@ NearestTiesToEven
roundTiesToEven.
@ Dynamic
Denotes mode unknown at compile time.
LLVM_ABI bool isGuaranteedNotToBeUndefOrPoison(const Value *V, AssumptionCache *AC=nullptr, const Instruction *CtxI=nullptr, const DominatorTree *DT=nullptr, unsigned Depth=0)
Return true if this function can prove that V does not have undef bits and is never poison.
constexpr unsigned BitWidth
LLVM_ABI Constant * getLosslessInvCast(Constant *C, Type *InvCastTo, unsigned CastOp, const DataLayout &DL, PreservedCastFlags *Flags=nullptr)
Try to cast C to InvC losslessly, satisfying CastOp(InvC) equals C, or CastOp(InvC) is a refined valu...
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:559
bool all_equal(std::initializer_list< T > Values)
Returns true if all Values in the initializer lists are equal or the list.
Definition STLExtras.h:2166
LLVM_ABI Constant * ConstantFoldCastInstruction(unsigned opcode, Constant *V, Type *DestTy)
LLVM_ABI Constant * ConstantFoldInsertValueInstruction(Constant *Agg, Constant *Val, ArrayRef< unsigned > Idxs)
Attempt to constant fold an insertvalue instruction with the specified operands and indices.
LLVM_ABI Constant * ConstantFoldLoadFromConstPtr(Constant *C, Type *Ty, APInt Offset, const DataLayout &DL)
Return the value that a load from C with offset Offset would produce if it is constant and determinab...
LLVM_ABI Constant * ConstantFoldInstOperands(const Instruction *I, ArrayRef< Constant * > Ops, const DataLayout &DL, const TargetLibraryInfo *TLI=nullptr, bool AllowNonDeterministic=true)
ConstantFoldInstOperands - Attempt to constant fold an instruction with the specified operands.
LLVM_READONLY APFloat minimum(const APFloat &A, const APFloat &B)
Implements IEEE 754-2019 minimum semantics.
Definition APFloat.h:1683
LLVM_READONLY APFloat maximumnum(const APFloat &A, const APFloat &B)
Implements IEEE 754-2019 maximumNumber semantics.
Definition APFloat.h:1723
LLVM_ABI const Value * getUnderlyingObject(const Value *V, unsigned MaxLookup=MaxLookupSearchDepth)
This method strips off any GEP address adjustments, pointer casts or llvm.threadlocal....
LLVM_ABI Constant * ConstantFoldIntegerCast(Constant *C, Type *DestTy, bool IsSigned, const DataLayout &DL)
Constant fold a zext, sext or trunc, depending on IsSigned and whether the DestTy is wider or narrowe...
LLVM_ABI bool isTriviallyVectorizable(Intrinsic::ID ID)
Identify if the intrinsic is trivially vectorizable.
constexpr detail::IsaCheckPredicate< Types... > IsaPred
Function object wrapper for the llvm::isa type check.
Definition Casting.h:866
LLVM_ABI Constant * ConstantFoldBinaryInstruction(unsigned Opcode, Constant *V1, Constant *V2)
Represent subnormal handling kind for floating point instruction inputs and outputs.
DenormalModeKind Input
Denormal treatment kind for floating point instruction inputs in the default floating-point environme...
DenormalModeKind
Represent handled modes for denormal (aka subnormal) modes in the floating point environment.
@ PreserveSign
The sign of a flushed-to-zero number is preserved in the sign of 0.
@ PositiveZero
Denormals are flushed to positive zero.
@ Dynamic
Denormals have unknown treatment.
@ IEEE
IEEE-754 denormal numbers preserved.
DenormalModeKind Output
Denormal flushing mode for floating point instruction results in the default floating point environme...
static constexpr DenormalMode getDynamic()
static constexpr DenormalMode getIEEE()
Incoming for lane mask phi as machine instruction, incoming register Reg and incoming block Block are...
bool isConstant() const
Returns true if we know the value of all bits.
Definition KnownBits.h:54
const APInt & getConstant() const
Returns the value when all bits have a known value.
Definition KnownBits.h:60