1//===-- ConstantFolding.cpp - Fold instructions into constants ------------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This file defines routines for folding instructions into constants.
10//
11// Also, to supplement the basic IR ConstantExpr simplifications,
12// this file defines some additional folding routines that can make use of
13// DataLayout information. These functions cannot go in IR due to library
14// dependency issues.
15//
16//===----------------------------------------------------------------------===//
17
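// Illustrative example of the extra folding DataLayout enables, assuming a
// little-endian target: given
//   @g = constant [4 x i8] c"\01\02\03\04"
// a load of i32 from @g folds to i32 0x04030201, which plain ConstantExpr
// simplification cannot compute without the target's endianness and type
// sizes.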
19#include "llvm/ADT/APFloat.h"
20#include "llvm/ADT/APInt.h"
21#include "llvm/ADT/APSInt.h"
22#include "llvm/ADT/ArrayRef.h"
23#include "llvm/ADT/DenseMap.h"
24#include "llvm/ADT/STLExtras.h"
26#include "llvm/ADT/StringRef.h"
31#include "llvm/Config/config.h"
32#include "llvm/IR/Constant.h"
34#include "llvm/IR/Constants.h"
35#include "llvm/IR/DataLayout.h"
37#include "llvm/IR/Function.h"
38#include "llvm/IR/GlobalValue.h"
40#include "llvm/IR/InstrTypes.h"
41#include "llvm/IR/Instruction.h"
44#include "llvm/IR/Intrinsics.h"
45#include "llvm/IR/IntrinsicsAArch64.h"
46#include "llvm/IR/IntrinsicsAMDGPU.h"
47#include "llvm/IR/IntrinsicsARM.h"
48#include "llvm/IR/IntrinsicsNVPTX.h"
49#include "llvm/IR/IntrinsicsWebAssembly.h"
50#include "llvm/IR/IntrinsicsX86.h"
52#include "llvm/IR/Operator.h"
53#include "llvm/IR/Type.h"
54#include "llvm/IR/Value.h"
59#include <cassert>
60#include <cerrno>
61#include <cfenv>
62#include <cmath>
63#include <cstdint>
64
65using namespace llvm;
66
68 "disable-fp-call-folding",
69 cl::desc("Disable constant-folding of FP intrinsics and libcalls."),
70 cl::init(false), cl::Hidden);
71
72namespace {
73
74//===----------------------------------------------------------------------===//
75// Constant Folding internal helper functions
76//===----------------------------------------------------------------------===//
77
78static Constant *foldConstVectorToAPInt(APInt &Result, Type *DestTy,
79 Constant *C, Type *SrcEltTy,
80 unsigned NumSrcElts,
81 const DataLayout &DL) {
82 // Now that we know that the input value is a vector of integers, just shift
83 // and insert them into our result.
84 unsigned BitShift = DL.getTypeSizeInBits(SrcEltTy);
85 for (unsigned i = 0; i != NumSrcElts; ++i) {
86 Constant *Element;
87 if (DL.isLittleEndian())
88 Element = C->getAggregateElement(NumSrcElts - i - 1);
89 else
90 Element = C->getAggregateElement(i);
91
92 if (isa_and_nonnull<UndefValue>(Element)) {
93 Result <<= BitShift;
94 continue;
95 }
96
97 auto *ElementCI = dyn_cast_or_null<ConstantInt>(Element);
98 if (!ElementCI)
99 return ConstantExpr::getBitCast(C, DestTy);
100
101 Result <<= BitShift;
102 Result |= ElementCI->getValue().zext(Result.getBitWidth());
103 }
104
105 return nullptr;
106}
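// Illustrative example for foldConstVectorToAPInt, assuming a little-endian
// DataLayout: folding
//   bitcast (<4 x i8> <i8 1, i8 2, i8 3, i8 4> to i32)
// visits the elements from last to first, shifting each into Result, so
// element 0 ends up in the lowest byte and the result is i32 0x04030201.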
107
108/// Constant fold bitcast, symbolically evaluating it with DataLayout.
109/// This always returns a non-null constant, but it may be a
110/// ConstantExpr if unfoldable.
111Constant *FoldBitCast(Constant *C, Type *DestTy, const DataLayout &DL) {
112 assert(CastInst::castIsValid(Instruction::BitCast, C, DestTy) &&
113 "Invalid constantexpr bitcast!");
114
115 // Catch the obvious splat cases.
116 if (Constant *Res = ConstantFoldLoadFromUniformValue(C, DestTy, DL))
117 return Res;
118
119 if (auto *VTy = dyn_cast<VectorType>(C->getType())) {
120 // Handle a vector->scalar integer/fp cast.
121 if (isa<IntegerType>(DestTy) || DestTy->isFloatingPointTy()) {
122 unsigned NumSrcElts = cast<FixedVectorType>(VTy)->getNumElements();
123 Type *SrcEltTy = VTy->getElementType();
124
125 // If the vector is a vector of floating point, convert it to vector of int
126 // to simplify things.
127 if (SrcEltTy->isFloatingPointTy()) {
128 unsigned FPWidth = SrcEltTy->getPrimitiveSizeInBits();
129 auto *SrcIVTy = FixedVectorType::get(
130 IntegerType::get(C->getContext(), FPWidth), NumSrcElts);
131 // Ask IR to do the conversion now that #elts line up.
132 C = ConstantExpr::getBitCast(C, SrcIVTy);
133 }
134
135 APInt Result(DL.getTypeSizeInBits(DestTy), 0);
136 if (Constant *CE = foldConstVectorToAPInt(Result, DestTy, C,
137 SrcEltTy, NumSrcElts, DL))
138 return CE;
139
140 if (isa<IntegerType>(DestTy))
141 return ConstantInt::get(DestTy, Result);
142
143 APFloat FP(DestTy->getFltSemantics(), Result);
144 return ConstantFP::get(DestTy->getContext(), FP);
145 }
146 }
147
148 // The code below only handles casts to vectors currently.
149 auto *DestVTy = dyn_cast<VectorType>(DestTy);
150 if (!DestVTy)
151 return ConstantExpr::getBitCast(C, DestTy);
152
153 // If this is a scalar -> vector cast, convert the input into a <1 x scalar>
154 // vector so the code below can handle it uniformly.
155 if (!isa<VectorType>(C->getType()) &&
156 (isa<ConstantFP>(C) || isa<ConstantInt>(C))) {
157 Constant *Ops = C; // don't take the address of C!
158 return FoldBitCast(ConstantVector::get(Ops), DestTy, DL);
159 }
160
161 // Some of what follows may extend to cover scalable vectors but the current
162 // implementation is fixed length specific.
163 if (!isa<FixedVectorType>(C->getType()))
164 return ConstantExpr::getBitCast(C, DestTy);
165
166 // If this is a bitcast from constant vector -> vector, fold it.
167 if (!isa<ConstantDataVector>(C) && !isa<ConstantVector>(C) &&
168 !isa<ConstantInt>(C) && !isa<ConstantFP>(C))
169 return ConstantExpr::getBitCast(C, DestTy);
170
171 // If the element types match, IR can fold it.
172 unsigned NumDstElt = cast<FixedVectorType>(DestVTy)->getNumElements();
173 unsigned NumSrcElt = cast<FixedVectorType>(C->getType())->getNumElements();
174 if (NumDstElt == NumSrcElt)
175 return ConstantExpr::getBitCast(C, DestTy);
176
177 Type *SrcEltTy = cast<VectorType>(C->getType())->getElementType();
178 Type *DstEltTy = DestVTy->getElementType();
179
180 // Otherwise, we're changing the number of elements in a vector, which
181 // requires endianness information to do the right thing. For example,
182 // bitcast (<2 x i64> <i64 0, i64 1> to <4 x i32>)
183 // folds to (little endian):
184 // <4 x i32> <i32 0, i32 0, i32 1, i32 0>
185 // and to (big endian):
186 // <4 x i32> <i32 0, i32 0, i32 0, i32 1>
187
188 // First things first. We only want to think about integers here, so if
189 // we have something in FP form, recast it as integer.
190 if (DstEltTy->isFloatingPointTy()) {
191 // Fold to a vector of integers with the same size as our FP type.
192 unsigned FPWidth = DstEltTy->getPrimitiveSizeInBits();
193 auto *DestIVTy = FixedVectorType::get(
194 IntegerType::get(C->getContext(), FPWidth), NumDstElt);
195 // Recursively handle this integer conversion, if possible.
196 C = FoldBitCast(C, DestIVTy, DL);
197
198 // Finally, IR can handle this now that #elts line up.
199 return ConstantExpr::getBitCast(C, DestTy);
200 }
201
202 // Okay, we know the destination is integer, if the input is FP, convert
203 // it to integer first.
204 if (SrcEltTy->isFloatingPointTy()) {
205 unsigned FPWidth = SrcEltTy->getPrimitiveSizeInBits();
206 auto *SrcIVTy = FixedVectorType::get(
207 IntegerType::get(C->getContext(), FPWidth), NumSrcElt);
208 // Ask IR to do the conversion now that #elts line up.
209 C = ConstantExpr::getBitCast(C, SrcIVTy);
210 assert((isa<ConstantVector>(C) || // FIXME: Remove ConstantVector.
211 isa<ConstantDataVector>(C) || isa<ConstantInt>(C)) &&
212 "Constant folding cannot fail for plain fp->int bitcast!");
213 }
214
215 // Now we know that the input and output vectors are both integer vectors
216 // of the same size, and that their #elements is not the same. Do the
217 // conversion here, which depends on whether the input or output has
218 // more elements.
219 bool isLittleEndian = DL.isLittleEndian();
220
221 SmallVector<Constant *, 32> Result;
222 if (NumDstElt < NumSrcElt) {
223 // Handle: bitcast (<4 x i32> <i32 0, i32 1, i32 2, i32 3> to <2 x i64>)
224 Constant *Zero = Constant::getNullValue(DstEltTy);
225 unsigned Ratio = NumSrcElt/NumDstElt;
226 unsigned SrcBitSize = SrcEltTy->getPrimitiveSizeInBits();
227 unsigned SrcElt = 0;
228 for (unsigned i = 0; i != NumDstElt; ++i) {
229 // Build each element of the result.
230 Constant *Elt = Zero;
231 unsigned ShiftAmt = isLittleEndian ? 0 : SrcBitSize*(Ratio-1);
232 for (unsigned j = 0; j != Ratio; ++j) {
233 Constant *Src = C->getAggregateElement(SrcElt++);
234 if (Src && isa<UndefValue>(Src))
235 Src = Constant::getNullValue(
236 cast<VectorType>(C->getType())->getElementType());
237 else
238 Src = dyn_cast_or_null<ConstantInt>(Src);
239 if (!Src) // Reject constantexpr elements.
240 return ConstantExpr::getBitCast(C, DestTy);
241
242 // Zero extend the element to the right size.
243 Src = ConstantFoldCastOperand(Instruction::ZExt, Src, Elt->getType(),
244 DL);
245 assert(Src && "Constant folding cannot fail on plain integers");
246
247 // Shift it to the right place, depending on endianness.
248 Src = ConstantFoldBinaryOpOperands(
249 Instruction::Shl, Src, ConstantInt::get(Src->getType(), ShiftAmt),
250 DL);
251 assert(Src && "Constant folding cannot fail on plain integers");
252
253 ShiftAmt += isLittleEndian ? SrcBitSize : -SrcBitSize;
254
255 // Mix it in.
256 Elt = ConstantFoldBinaryOpOperands(Instruction::Or, Elt, Src, DL);
257 assert(Elt && "Constant folding cannot fail on plain integers");
258 }
259 Result.push_back(Elt);
260 }
261 return ConstantVector::get(Result);
262 }
263
264 // Handle: bitcast (<2 x i64> <i64 0, i64 1> to <4 x i32>)
265 unsigned Ratio = NumDstElt/NumSrcElt;
266 unsigned DstBitSize = DL.getTypeSizeInBits(DstEltTy);
267
268 // Loop over each source value, expanding into multiple results.
269 for (unsigned i = 0; i != NumSrcElt; ++i) {
270 auto *Element = C->getAggregateElement(i);
271
272 if (!Element) // Reject constantexpr elements.
273 return ConstantExpr::getBitCast(C, DestTy);
274
275 if (isa<UndefValue>(Element)) {
276 // Correctly Propagate undef values.
277 Result.append(Ratio, UndefValue::get(DstEltTy));
278 continue;
279 }
280
281 auto *Src = dyn_cast<ConstantInt>(Element);
282 if (!Src)
283 return ConstantExpr::getBitCast(C, DestTy);
284
285 unsigned ShiftAmt = isLittleEndian ? 0 : DstBitSize*(Ratio-1);
286 for (unsigned j = 0; j != Ratio; ++j) {
287 // Shift the piece of the value into the right place, depending on
288 // endianness.
289 APInt Elt = Src->getValue().lshr(ShiftAmt);
290 ShiftAmt += isLittleEndian ? DstBitSize : -DstBitSize;
291
292 // Truncate and remember this piece.
293 Result.push_back(ConstantInt::get(DstEltTy, Elt.trunc(DstBitSize)));
294 }
295 }
296
297 return ConstantVector::get(Result);
298}
299
300} // end anonymous namespace
301
302/// If this constant is a constant offset from a global, return the global and
303/// the constant. Because of constantexprs, this function is recursive.
304bool llvm::IsConstantOffsetFromGlobal(Constant *C, GlobalValue *&GV,
305 APInt &Offset, const DataLayout &DL,
306 DSOLocalEquivalent **DSOEquiv) {
307 if (DSOEquiv)
308 *DSOEquiv = nullptr;
309
310 // Trivial case, constant is the global.
311 if ((GV = dyn_cast<GlobalValue>(C))) {
312 unsigned BitWidth = DL.getIndexTypeSizeInBits(GV->getType());
313 Offset = APInt(BitWidth, 0);
314 return true;
315 }
316
317 if (auto *FoundDSOEquiv = dyn_cast<DSOLocalEquivalent>(C)) {
318 if (DSOEquiv)
319 *DSOEquiv = FoundDSOEquiv;
320 GV = FoundDSOEquiv->getGlobalValue();
321 unsigned BitWidth = DL.getIndexTypeSizeInBits(GV->getType());
322 Offset = APInt(BitWidth, 0);
323 return true;
324 }
325
326 // Otherwise, if this isn't a constant expr, bail out.
327 auto *CE = dyn_cast<ConstantExpr>(C);
328 if (!CE) return false;
329
330 // Look through ptr->int and ptr->ptr casts.
331 if (CE->getOpcode() == Instruction::PtrToInt ||
332 CE->getOpcode() == Instruction::PtrToAddr ||
333 CE->getOpcode() == Instruction::BitCast)
334 return IsConstantOffsetFromGlobal(CE->getOperand(0), GV, Offset, DL,
335 DSOEquiv);
336
337 // i32* getelementptr ([5 x i32]* @a, i32 0, i32 5)
338 auto *GEP = dyn_cast<GEPOperator>(CE);
339 if (!GEP)
340 return false;
341
342 unsigned BitWidth = DL.getIndexTypeSizeInBits(GEP->getType());
343 APInt TmpOffset(BitWidth, 0);
344
345 // If the base isn't a global+constant, we aren't either.
346 if (!IsConstantOffsetFromGlobal(CE->getOperand(0), GV, TmpOffset, DL,
347 DSOEquiv))
348 return false;
349
350 // Otherwise, add any offset that our operands provide.
351 if (!GEP->accumulateConstantOffset(DL, TmpOffset))
352 return false;
353
354 Offset = TmpOffset;
355 return true;
356}
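// Illustrative example: for the constant expression
//   getelementptr inbounds ([10 x i32], ptr @a, i64 0, i64 3)
// IsConstantOffsetFromGlobal returns true with GV = @a and Offset = 12
// (three i32 elements at 4 bytes each).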
357
358Constant *llvm::ConstantFoldLoadThroughBitcast(Constant *C, Type *DestTy,
359 const DataLayout &DL) {
360 do {
361 Type *SrcTy = C->getType();
362 if (SrcTy == DestTy)
363 return C;
364
365 TypeSize DestSize = DL.getTypeSizeInBits(DestTy);
366 TypeSize SrcSize = DL.getTypeSizeInBits(SrcTy);
367 if (!TypeSize::isKnownGE(SrcSize, DestSize))
368 return nullptr;
369
370 // Catch the obvious splat cases (since all-zeros can coerce non-integral
371 // pointers legally).
372 if (Constant *Res = ConstantFoldLoadFromUniformValue(C, DestTy, DL))
373 return Res;
374
375 // If the type sizes are the same and a cast is legal, just directly
376 // cast the constant.
377 // But be careful not to coerce non-integral pointers illegally.
378 if (SrcSize == DestSize &&
379 DL.isNonIntegralPointerType(SrcTy->getScalarType()) ==
380 DL.isNonIntegralPointerType(DestTy->getScalarType())) {
381 Instruction::CastOps Cast = Instruction::BitCast;
382 // If we are going from a pointer to int or vice versa, we spell the cast
383 // differently.
384 if (SrcTy->isIntegerTy() && DestTy->isPointerTy())
385 Cast = Instruction::IntToPtr;
386 else if (SrcTy->isPointerTy() && DestTy->isIntegerTy())
387 Cast = Instruction::PtrToInt;
388
389 if (CastInst::castIsValid(Cast, C, DestTy))
390 return ConstantFoldCastOperand(Cast, C, DestTy, DL);
391 }
392
393 // If this isn't an aggregate type, there is nothing we can do to drill down
394 // and find a bitcastable constant.
395 if (!SrcTy->isAggregateType() && !SrcTy->isVectorTy())
396 return nullptr;
397
398 // We're simulating a load through a pointer that was bitcast to point to
399 // a different type, so we can try to walk down through the initial
400 // elements of an aggregate to see if some part of the aggregate is
401 // castable to implement the "load" semantic model.
402 if (SrcTy->isStructTy()) {
403 // Struct types might have leading zero-length elements like [0 x i32],
404 // which are certainly not what we are looking for, so skip them.
405 unsigned Elem = 0;
406 Constant *ElemC;
407 do {
408 ElemC = C->getAggregateElement(Elem++);
409 } while (ElemC && DL.getTypeSizeInBits(ElemC->getType()).isZero());
410 C = ElemC;
411 } else {
412 // For non-byte-sized vector elements, the first element is not
413 // necessarily located at the vector base address.
414 if (auto *VT = dyn_cast<VectorType>(SrcTy))
415 if (!DL.typeSizeEqualsStoreSize(VT->getElementType()))
416 return nullptr;
417
418 C = C->getAggregateElement(0u);
419 }
420 } while (C);
421
422 return nullptr;
423}
424
425namespace {
426
427/// Recursive helper to read bits out of global. C is the constant being copied
428/// out of. ByteOffset is an offset into C. CurPtr is the pointer to copy
429/// results into and BytesLeft is the number of bytes left in
430/// the CurPtr buffer. DL is the DataLayout.
431bool ReadDataFromGlobal(Constant *C, uint64_t ByteOffset, unsigned char *CurPtr,
432 unsigned BytesLeft, const DataLayout &DL) {
433 assert(ByteOffset <= DL.getTypeAllocSize(C->getType()) &&
434 "Out of range access");
435
436 // Reading type padding, return zero.
437 if (ByteOffset >= DL.getTypeStoreSize(C->getType()))
438 return true;
439
440 // If this element is zero or undefined, we can just return since *CurPtr is
441 // zero initialized.
442 if (isa<ConstantAggregateZero>(C) || isa<UndefValue>(C))
443 return true;
444
445 if (auto *CI = dyn_cast<ConstantInt>(C)) {
446 if ((CI->getBitWidth() & 7) != 0)
447 return false;
448 const APInt &Val = CI->getValue();
449 unsigned IntBytes = unsigned(CI->getBitWidth()/8);
450
451 for (unsigned i = 0; i != BytesLeft && ByteOffset != IntBytes; ++i) {
452 unsigned n = ByteOffset;
453 if (!DL.isLittleEndian())
454 n = IntBytes - n - 1;
455 CurPtr[i] = Val.extractBits(8, n * 8).getZExtValue();
456 ++ByteOffset;
457 }
458 return true;
459 }
460
461 if (auto *CFP = dyn_cast<ConstantFP>(C)) {
462 if (CFP->getType()->isDoubleTy()) {
463 C = FoldBitCast(C, Type::getInt64Ty(C->getContext()), DL);
464 return ReadDataFromGlobal(C, ByteOffset, CurPtr, BytesLeft, DL);
465 }
466 if (CFP->getType()->isFloatTy()){
467 C = FoldBitCast(C, Type::getInt32Ty(C->getContext()), DL);
468 return ReadDataFromGlobal(C, ByteOffset, CurPtr, BytesLeft, DL);
469 }
470 if (CFP->getType()->isHalfTy()){
471 C = FoldBitCast(C, Type::getInt16Ty(C->getContext()), DL);
472 return ReadDataFromGlobal(C, ByteOffset, CurPtr, BytesLeft, DL);
473 }
474 return false;
475 }
476
477 if (auto *CS = dyn_cast<ConstantStruct>(C)) {
478 const StructLayout *SL = DL.getStructLayout(CS->getType());
479 unsigned Index = SL->getElementContainingOffset(ByteOffset);
480 uint64_t CurEltOffset = SL->getElementOffset(Index);
481 ByteOffset -= CurEltOffset;
482
483 while (true) {
484 // If the element access is to the element itself and not to tail padding,
485 // read the bytes from the element.
486 uint64_t EltSize = DL.getTypeAllocSize(CS->getOperand(Index)->getType());
487
488 if (ByteOffset < EltSize &&
489 !ReadDataFromGlobal(CS->getOperand(Index), ByteOffset, CurPtr,
490 BytesLeft, DL))
491 return false;
492
493 ++Index;
494
495 // Check to see if we read from the last struct element, if so we're done.
496 if (Index == CS->getType()->getNumElements())
497 return true;
498
499 // If we read all of the bytes we needed from this element we're done.
500 uint64_t NextEltOffset = SL->getElementOffset(Index);
501
502 if (BytesLeft <= NextEltOffset - CurEltOffset - ByteOffset)
503 return true;
504
505 // Move to the next element of the struct.
506 CurPtr += NextEltOffset - CurEltOffset - ByteOffset;
507 BytesLeft -= NextEltOffset - CurEltOffset - ByteOffset;
508 ByteOffset = 0;
509 CurEltOffset = NextEltOffset;
510 }
511 // not reached.
512 }
513
514 if (isa<ConstantArray>(C) || isa<ConstantVector>(C) ||
515 isa<ConstantDataSequential>(C)) {
516 uint64_t NumElts, EltSize;
517 Type *EltTy;
518 if (auto *AT = dyn_cast<ArrayType>(C->getType())) {
519 NumElts = AT->getNumElements();
520 EltTy = AT->getElementType();
521 EltSize = DL.getTypeAllocSize(EltTy);
522 } else {
523 NumElts = cast<FixedVectorType>(C->getType())->getNumElements();
524 EltTy = cast<FixedVectorType>(C->getType())->getElementType();
525 // TODO: For non-byte-sized vectors, current implementation assumes there is
526 // padding to the next byte boundary between elements.
527 if (!DL.typeSizeEqualsStoreSize(EltTy))
528 return false;
529
530 EltSize = DL.getTypeStoreSize(EltTy);
531 }
532 uint64_t Index = ByteOffset / EltSize;
533 uint64_t Offset = ByteOffset - Index * EltSize;
534
535 for (; Index != NumElts; ++Index) {
536 if (!ReadDataFromGlobal(C->getAggregateElement(Index), Offset, CurPtr,
537 BytesLeft, DL))
538 return false;
539
540 uint64_t BytesWritten = EltSize - Offset;
541 assert(BytesWritten <= EltSize && "Not indexing into this element?");
542 if (BytesWritten >= BytesLeft)
543 return true;
544
545 Offset = 0;
546 BytesLeft -= BytesWritten;
547 CurPtr += BytesWritten;
548 }
549 return true;
550 }
551
552 if (auto *CE = dyn_cast<ConstantExpr>(C)) {
553 if (CE->getOpcode() == Instruction::IntToPtr &&
554 CE->getOperand(0)->getType() == DL.getIntPtrType(CE->getType())) {
555 return ReadDataFromGlobal(CE->getOperand(0), ByteOffset, CurPtr,
556 BytesLeft, DL);
557 }
558 }
559
560 // Otherwise, unknown initializer type.
561 return false;
562}
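// Illustrative example, assuming a little-endian DataLayout: calling
// ReadDataFromGlobal on the initializer i32 305419896 (0x12345678) with
// ByteOffset 0 and BytesLeft 4 fills CurPtr with { 0x78, 0x56, 0x34, 0x12 }.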
563
564Constant *FoldReinterpretLoadFromConst(Constant *C, Type *LoadTy,
565 int64_t Offset, const DataLayout &DL) {
566 // Bail out early. We do not expect to load from a scalable global variable.
567 if (isa<ScalableVectorType>(LoadTy))
568 return nullptr;
569
570 auto *IntType = dyn_cast<IntegerType>(LoadTy);
571
572 // If this isn't an integer load we can't fold it directly.
573 if (!IntType) {
574 // If this is a non-integer load, we can try folding it as an int load and
575 // then bitcast the result. This can be useful for union cases. Note
576 // that address spaces don't matter here since we're not going to result in
577 // an actual new load.
578 if (!LoadTy->isFloatingPointTy() && !LoadTy->isPointerTy() &&
579 !LoadTy->isVectorTy())
580 return nullptr;
581
582 Type *MapTy = Type::getIntNTy(C->getContext(),
583 DL.getTypeSizeInBits(LoadTy).getFixedValue());
584 if (Constant *Res = FoldReinterpretLoadFromConst(C, MapTy, Offset, DL)) {
585 if (Res->isNullValue() && !LoadTy->isX86_AMXTy())
586 // Materializing a zero can be done trivially without a bitcast
587 return Constant::getNullValue(LoadTy);
588 Type *CastTy = LoadTy->isPtrOrPtrVectorTy() ? DL.getIntPtrType(LoadTy) : LoadTy;
589 Res = FoldBitCast(Res, CastTy, DL);
590 if (LoadTy->isPtrOrPtrVectorTy()) {
591 // For a vector of pointers, we first convert to a vector of integers, then do the vector inttoptr.
592 if (Res->isNullValue() && !LoadTy->isX86_AMXTy())
593 return Constant::getNullValue(LoadTy);
594 if (DL.isNonIntegralPointerType(LoadTy->getScalarType()))
595 // Be careful not to replace a load of an addrspace value with an inttoptr here
596 return nullptr;
597 Res = ConstantExpr::getIntToPtr(Res, LoadTy);
598 }
599 return Res;
600 }
601 return nullptr;
602 }
603
604 unsigned BytesLoaded = (IntType->getBitWidth() + 7) / 8;
605 if (BytesLoaded > 32 || BytesLoaded == 0)
606 return nullptr;
607
608 // If we're not accessing anything in this constant, the result is undefined.
609 if (Offset <= -1 * static_cast<int64_t>(BytesLoaded))
610 return PoisonValue::get(IntType);
611
612 // TODO: We should be able to support scalable types.
613 TypeSize InitializerSize = DL.getTypeAllocSize(C->getType());
614 if (InitializerSize.isScalable())
615 return nullptr;
616
617 // If we're not accessing anything in this constant, the result is undefined.
618 if (Offset >= (int64_t)InitializerSize.getFixedValue())
619 return PoisonValue::get(IntType);
620
621 unsigned char RawBytes[32] = {0};
622 unsigned char *CurPtr = RawBytes;
623 unsigned BytesLeft = BytesLoaded;
624
625 // If we're loading off the beginning of the global, some bytes may be valid.
626 if (Offset < 0) {
627 CurPtr += -Offset;
628 BytesLeft += Offset;
629 Offset = 0;
630 }
631
632 if (!ReadDataFromGlobal(C, Offset, CurPtr, BytesLeft, DL))
633 return nullptr;
634
635 APInt ResultVal = APInt(IntType->getBitWidth(), 0);
636 if (DL.isLittleEndian()) {
637 ResultVal = RawBytes[BytesLoaded - 1];
638 for (unsigned i = 1; i != BytesLoaded; ++i) {
639 ResultVal <<= 8;
640 ResultVal |= RawBytes[BytesLoaded - 1 - i];
641 }
642 } else {
643 ResultVal = RawBytes[0];
644 for (unsigned i = 1; i != BytesLoaded; ++i) {
645 ResultVal <<= 8;
646 ResultVal |= RawBytes[i];
647 }
648 }
649
650 return ConstantInt::get(IntType->getContext(), ResultVal);
651}
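// Illustrative example: with @g = constant [4 x i8] c"\01\02\03\04", a
// FoldReinterpretLoadFromConst of i16 at Offset 2 reads the bytes 0x03 and
// 0x04 and, on a little-endian target, reassembles them into i16 0x0403.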
652
653} // anonymous namespace
654
655// If GV is a constant with an initializer read its representation starting
656// at Offset and return it as a constant array of unsigned char. Otherwise
657// return null.
658Constant *llvm::ReadByteArrayFromGlobal(const GlobalVariable *GV,
659 uint64_t Offset) {
660 if (!GV->isConstant() || !GV->hasDefinitiveInitializer())
661 return nullptr;
662
663 const DataLayout &DL = GV->getDataLayout();
664 Constant *Init = const_cast<Constant *>(GV->getInitializer());
665 TypeSize InitSize = DL.getTypeAllocSize(Init->getType());
666 if (InitSize < Offset)
667 return nullptr;
668
669 uint64_t NBytes = InitSize - Offset;
670 if (NBytes > UINT16_MAX)
671 // Bail for large initializers in excess of 64K to avoid allocating
672 // too much memory.
673 // Offset is assumed to be less than or equal to InitSize (this
674 // is enforced in ReadDataFromGlobal).
675 return nullptr;
676
677 SmallVector<unsigned char, 256> RawBytes(static_cast<size_t>(NBytes));
678 unsigned char *CurPtr = RawBytes.data();
679
680 if (!ReadDataFromGlobal(Init, Offset, CurPtr, NBytes, DL))
681 return nullptr;
682
683 return ConstantDataArray::get(GV->getContext(), RawBytes);
684}
685
686/// If this Offset points exactly to the start of an aggregate element, return
687/// that element, otherwise return nullptr.
688Constant *getConstantAtOffset(Constant *Base, APInt Offset,
689 const DataLayout &DL) {
690 if (Offset.isZero())
691 return Base;
692
693 if (!isa<ConstantAggregate>(Base) && !isa<ConstantDataSequential>(Base))
694 return nullptr;
695
696 Type *ElemTy = Base->getType();
697 SmallVector<APInt> Indices = DL.getGEPIndicesForOffset(ElemTy, Offset);
698 if (!Offset.isZero() || !Indices[0].isZero())
699 return nullptr;
700
701 Constant *C = Base;
702 for (const APInt &Index : drop_begin(Indices)) {
703 if (Index.isNegative() || Index.getActiveBits() >= 32)
704 return nullptr;
705
706 C = C->getAggregateElement(Index.getZExtValue());
707 if (!C)
708 return nullptr;
709 }
710
711 return C;
712}
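// Illustrative example: for Base = { i32 1, i32 2, i32 3 } (a struct of three
// i32s) and Offset = 4, the computed indices are (0, 1), so element i32 2 is
// returned; Offset = 6 does not point at the start of any element and yields
// nullptr.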
713
714Constant *llvm::ConstantFoldLoadFromConst(Constant *C, Type *Ty,
715 const APInt &Offset,
716 const DataLayout &DL) {
717 if (Constant *AtOffset = getConstantAtOffset(C, Offset, DL))
718 if (Constant *Result = ConstantFoldLoadThroughBitcast(AtOffset, Ty, DL))
719 return Result;
720
721 // Explicitly check for out-of-bounds access, so we return poison even if the
722 // constant is a uniform value.
723 TypeSize Size = DL.getTypeAllocSize(C->getType());
724 if (!Size.isScalable() && Offset.sge(Size.getFixedValue()))
725 return PoisonValue::get(Ty);
726
727 // Try an offset-independent fold of a uniform value.
728 if (Constant *Result = ConstantFoldLoadFromUniformValue(C, Ty, DL))
729 return Result;
730
731 // Try hard to fold loads from bitcasted strange and non-type-safe things.
732 if (Offset.getSignificantBits() <= 64)
733 if (Constant *Result =
734 FoldReinterpretLoadFromConst(C, Ty, Offset.getSExtValue(), DL))
735 return Result;
736
737 return nullptr;
738}
739
740Constant *llvm::ConstantFoldLoadFromConst(Constant *C, Type *Ty,
741 const DataLayout &DL) {
742 APInt Offset(DL.getIndexTypeSizeInBits(C->getType()), 0);
743 return ConstantFoldLoadFromConst(C, Ty, Offset, DL);
744}
745
746Constant *llvm::ConstantFoldLoadFromConstPtr(Constant *C, Type *Ty,
747 APInt Offset, const DataLayout &DL) {
748 // We can only fold loads from constant globals with a definitive initializer.
749 // Check this upfront, to skip expensive offset calculations.
750 auto *GV = dyn_cast<GlobalVariable>(getUnderlyingObject(C));
751 if (!GV || !GV->isConstant() || !GV->hasDefinitiveInitializer())
752 return nullptr;
753
754 C = cast<Constant>(C->stripAndAccumulateConstantOffsets(
755 DL, Offset, /* AllowNonInbounds */ true));
756
757 if (C == GV)
758 if (Constant *Result = ConstantFoldLoadFromConst(GV->getInitializer(), Ty,
759 Offset, DL))
760 return Result;
761
762 // If this load comes from anywhere in a uniform constant global, the value
763 // is always the same, regardless of the loaded offset.
764 return ConstantFoldLoadFromUniformValue(GV->getInitializer(), Ty, DL);
765}
766
767Constant *llvm::ConstantFoldLoadFromConstPtr(Constant *C, Type *Ty,
768 const DataLayout &DL) {
769 APInt Offset(DL.getIndexTypeSizeInBits(C->getType()), 0);
770 return ConstantFoldLoadFromConstPtr(C, Ty, std::move(Offset), DL);
771}
772
773Constant *llvm::ConstantFoldLoadFromUniformValue(Constant *C, Type *Ty,
774 const DataLayout &DL) {
775 if (isa<PoisonValue>(C))
776 return PoisonValue::get(Ty);
777 if (isa<UndefValue>(C))
778 return UndefValue::get(Ty);
779 // If padding is needed when storing C to memory, then it isn't considered as
780 // uniform.
781 if (!DL.typeSizeEqualsStoreSize(C->getType()))
782 return nullptr;
783 if (C->isNullValue() && !Ty->isX86_AMXTy())
784 return Constant::getNullValue(Ty);
785 if (C->isAllOnesValue() &&
786 (Ty->isIntOrIntVectorTy() || Ty->isFPOrFPVectorTy()))
787 return Constant::getAllOnesValue(Ty);
788 return nullptr;
789}
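// Illustrative example: a load of any type, at any in-bounds offset, from
//   @g = constant [64 x i32] zeroinitializer
// folds to the zero value of the loaded type, because every byte of the
// initializer is known to be zero.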
790
791namespace {
792
793/// One of Op0/Op1 is a constant expression.
794/// Attempt to symbolically evaluate the result of a binary operator merging
795/// these together. If target data info is available, it is provided as DL,
796/// otherwise DL is null.
797Constant *SymbolicallyEvaluateBinop(unsigned Opc, Constant *Op0, Constant *Op1,
798 const DataLayout &DL) {
799 // SROA
800
801 // Fold (and 0xffffffff00000000, (shl x, 32)) -> shl.
802 // Fold (lshr (or X, Y), 32) -> (lshr [X/Y], 32) if one doesn't contribute
803 // bits.
804
805 if (Opc == Instruction::And) {
806 KnownBits Known0 = computeKnownBits(Op0, DL);
807 KnownBits Known1 = computeKnownBits(Op1, DL);
808 if ((Known1.One | Known0.Zero).isAllOnes()) {
809 // All the bits of Op0 that the 'and' could be masking are already zero.
810 return Op0;
811 }
812 if ((Known0.One | Known1.Zero).isAllOnes()) {
813 // All the bits of Op1 that the 'and' could be masking are already zero.
814 return Op1;
815 }
816
817 Known0 &= Known1;
818 if (Known0.isConstant())
819 return ConstantInt::get(Op0->getType(), Known0.getConstant());
820 }
821
822 // If the constant expr is something like &A[123] - &A[4].f, fold this into a
823 // constant. This happens frequently when iterating over a global array.
824 if (Opc == Instruction::Sub) {
825 GlobalValue *GV1, *GV2;
826 APInt Offs1, Offs2;
827
828 if (IsConstantOffsetFromGlobal(Op0, GV1, Offs1, DL))
829 if (IsConstantOffsetFromGlobal(Op1, GV2, Offs2, DL) && GV1 == GV2) {
830 unsigned OpSize = DL.getTypeSizeInBits(Op0->getType());
831
832 // (&GV+C1) - (&GV+C2) -> C1-C2, pointer arithmetic cannot overflow.
833 // PtrToInt may change the bitwidth so we have to convert to the right size
834 // first.
835 return ConstantInt::get(Op0->getType(), Offs1.zextOrTrunc(OpSize) -
836 Offs2.zextOrTrunc(OpSize));
837 }
838 }
839
840 return nullptr;
841}
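// Illustrative example of the Sub case above: for @A = global [200 x i32],
// subtracting ptrtoint(&A[4]) from ptrtoint(&A[123]) decomposes both
// operands into @A plus byte offsets 16 and 492, and folds to 476.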
842
843/// If array indices are not pointer-sized integers, explicitly cast them so
844/// that they aren't implicitly casted by the getelementptr.
845Constant *CastGEPIndices(Type *SrcElemTy, ArrayRef<Constant *> Ops,
846 Type *ResultTy, GEPNoWrapFlags NW,
847 std::optional<ConstantRange> InRange,
848 const DataLayout &DL, const TargetLibraryInfo *TLI) {
849 Type *IntIdxTy = DL.getIndexType(ResultTy);
850 Type *IntIdxScalarTy = IntIdxTy->getScalarType();
851
852 bool Any = false;
853 SmallVector<Constant *, 32> NewIdxs;
854 for (unsigned i = 1, e = Ops.size(); i != e; ++i) {
855 if ((i == 1 ||
856 !isa<StructType>(GetElementPtrInst::getIndexedType(
857 SrcElemTy, Ops.slice(1, i - 1)))) &&
858 Ops[i]->getType()->getScalarType() != IntIdxScalarTy) {
859 Any = true;
860 Type *NewType =
861 Ops[i]->getType()->isVectorTy() ? IntIdxTy : IntIdxScalarTy;
862 Constant *NewIdx = ConstantFoldCastOperand(
863 CastInst::getCastOpcode(Ops[i], true, NewType, true), Ops[i], NewType,
864 DL);
865 if (!NewIdx)
866 return nullptr;
867 NewIdxs.push_back(NewIdx);
868 } else
869 NewIdxs.push_back(Ops[i]);
870 }
871
872 if (!Any)
873 return nullptr;
874
875 Constant *C =
876 ConstantExpr::getGetElementPtr(SrcElemTy, Ops[0], NewIdxs, NW, InRange);
877 return ConstantFoldConstant(C, DL, TLI);
878}
879
880/// If we can symbolically evaluate the GEP constant expression, do so.
881Constant *SymbolicallyEvaluateGEP(const GEPOperator *GEP,
882 ArrayRef<Constant *> Ops,
883 const DataLayout &DL,
884 const TargetLibraryInfo *TLI) {
885 Type *SrcElemTy = GEP->getSourceElementType();
886 Type *ResTy = GEP->getType();
887 if (!SrcElemTy->isSized() || isa<ScalableVectorType>(SrcElemTy))
888 return nullptr;
889
890 if (Constant *C = CastGEPIndices(SrcElemTy, Ops, ResTy, GEP->getNoWrapFlags(),
891 GEP->getInRange(), DL, TLI))
892 return C;
893
894 Constant *Ptr = Ops[0];
895 if (!Ptr->getType()->isPointerTy())
896 return nullptr;
897
898 Type *IntIdxTy = DL.getIndexType(Ptr->getType());
899
900 for (unsigned i = 1, e = Ops.size(); i != e; ++i)
901 if (!isa<ConstantInt>(Ops[i]) || !Ops[i]->getType()->isIntegerTy())
902 return nullptr;
903
904 unsigned BitWidth = DL.getTypeSizeInBits(IntIdxTy);
905 APInt Offset = APInt(
906 BitWidth,
907 DL.getIndexedOffsetInType(
908 SrcElemTy, ArrayRef((Value *const *)Ops.data() + 1, Ops.size() - 1)),
909 /*isSigned=*/true, /*implicitTrunc=*/true);
910
911 std::optional<ConstantRange> InRange = GEP->getInRange();
912 if (InRange)
913 InRange = InRange->sextOrTrunc(BitWidth);
914
915 // If this is a GEP of a GEP, fold it all into a single GEP.
916 GEPNoWrapFlags NW = GEP->getNoWrapFlags();
917 bool Overflow = false;
918 while (auto *GEP = dyn_cast<GEPOperator>(Ptr)) {
919 NW &= GEP->getNoWrapFlags();
920
921 SmallVector<Value *, 4> NestedOps(llvm::drop_begin(GEP->operands()));
922
923 // Do not try to incorporate the sub-GEP if some index is not a number.
924 bool AllConstantInt = true;
925 for (Value *NestedOp : NestedOps)
926 if (!isa<ConstantInt>(NestedOp)) {
927 AllConstantInt = false;
928 break;
929 }
930 if (!AllConstantInt)
931 break;
932
933 // Adjust inrange offset and intersect inrange attributes
934 if (auto GEPRange = GEP->getInRange()) {
935 auto AdjustedGEPRange = GEPRange->sextOrTrunc(BitWidth).subtract(Offset);
936 InRange =
937 InRange ? InRange->intersectWith(AdjustedGEPRange) : AdjustedGEPRange;
938 }
939
940 Ptr = cast<Constant>(GEP->getOperand(0));
941 SrcElemTy = GEP->getSourceElementType();
942 Offset = Offset.sadd_ov(
943 APInt(BitWidth, DL.getIndexedOffsetInType(SrcElemTy, NestedOps),
944 /*isSigned=*/true, /*implicitTrunc=*/true),
945 Overflow);
946 }
947
948 // Preserving nusw (without inbounds) also requires that the offset
949 // additions did not overflow.
950 if (NW.hasNoUnsignedSignedWrap() && !NW.isInBounds() && Overflow)
951 NW = NW.withoutNoUnsignedSignedWrap();
952
953 // If the base value for this address is a literal integer value, fold the
954 // getelementptr to the resulting integer value casted to the pointer type.
955 APInt BaseIntVal(DL.getPointerTypeSizeInBits(Ptr->getType()), 0);
956 if (auto *CE = dyn_cast<ConstantExpr>(Ptr)) {
957 if (CE->getOpcode() == Instruction::IntToPtr) {
958 if (auto *Base = dyn_cast<ConstantInt>(CE->getOperand(0)))
959 BaseIntVal = Base->getValue().zextOrTrunc(BaseIntVal.getBitWidth());
960 }
961 }
962
963 if ((Ptr->isNullValue() || BaseIntVal != 0) &&
964 !DL.mustNotIntroduceIntToPtr(Ptr->getType())) {
965
966 // If the index size is smaller than the pointer size, add to the low
967 // bits only.
968 BaseIntVal.insertBits(BaseIntVal.trunc(BitWidth) + Offset, 0);
969 Constant *C = ConstantInt::get(Ptr->getContext(), BaseIntVal);
970 return ConstantExpr::getIntToPtr(C, ResTy);
971 }
972
973 // Try to infer inbounds for GEPs of globals.
974 if (!NW.isInBounds() && Offset.isNonNegative()) {
975 bool CanBeNull, CanBeFreed;
976 uint64_t DerefBytes =
977 Ptr->getPointerDereferenceableBytes(DL, CanBeNull, CanBeFreed);
978 if (DerefBytes != 0 && !CanBeNull && Offset.sle(DerefBytes))
979 NW |= GEPNoWrapFlags::inBounds();
980 }
981
982 // nusw + nneg -> nuw
983 if (NW.hasNoUnsignedSignedWrap() && Offset.isNonNegative())
984 NW |= GEPNoWrapFlags::noUnsignedWrap();
985
986 // Otherwise canonicalize this to a single ptradd.
987 LLVMContext &Ctx = Ptr->getContext();
988 return ConstantExpr::getGetElementPtr(Type::getInt8Ty(Ctx), Ptr,
989 ConstantInt::get(Ctx, Offset), NW,
990 InRange);
991}
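// Illustrative example: a GEP of a GEP such as
//   getelementptr (i32, ptr getelementptr (i32, ptr @g, i64 2), i64 3)
// accumulates a single byte offset of (2 + 3) * 4 = 20 and is canonicalized
// to getelementptr (i8, ptr @g, i64 20).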
992
993/// Attempt to constant fold an instruction with the
994/// specified opcode and operands. If successful, the constant result is
995/// returned, if not, null is returned. Note that this function can fail when
996/// attempting to fold instructions like loads and stores, which have no
997/// constant expression form.
998Constant *ConstantFoldInstOperandsImpl(const Value *InstOrCE, unsigned Opcode,
999 ArrayRef<Constant *> Ops,
1000 const DataLayout &DL,
1001 const TargetLibraryInfo *TLI,
1002 bool AllowNonDeterministic) {
1003 Type *DestTy = InstOrCE->getType();
1004
1005 if (Instruction::isUnaryOp(Opcode))
1006 return ConstantFoldUnaryOpOperand(Opcode, Ops[0], DL);
1007
1008 if (Instruction::isBinaryOp(Opcode)) {
1009 switch (Opcode) {
1010 default:
1011 break;
1012 case Instruction::FAdd:
1013 case Instruction::FSub:
1014 case Instruction::FMul:
1015 case Instruction::FDiv:
1016 case Instruction::FRem:
1017 // Handle floating point instructions separately to account for denormals
1018 // TODO: If a constant expression is being folded rather than an
1019 // instruction, denormals will not be flushed/treated as zero
1020 if (const auto *I = dyn_cast<Instruction>(InstOrCE)) {
1021 return ConstantFoldFPInstOperands(Opcode, Ops[0], Ops[1], DL, I,
1022 AllowNonDeterministic);
1023 }
1024 }
1025 return ConstantFoldBinaryOpOperands(Opcode, Ops[0], Ops[1], DL);
1026 }
1027
1028 if (Instruction::isCast(Opcode))
1029 return ConstantFoldCastOperand(Opcode, Ops[0], DestTy, DL);
1030
1031 if (auto *GEP = dyn_cast<GEPOperator>(InstOrCE)) {
1032 Type *SrcElemTy = GEP->getSourceElementType();
1033 if (!SrcElemTy->isSized() || isa<ScalableVectorType>(SrcElemTy))
1034 return nullptr;
1035
1036 if (Constant *C = SymbolicallyEvaluateGEP(GEP, Ops, DL, TLI))
1037 return C;
1038
1039 return ConstantExpr::getGetElementPtr(SrcElemTy, Ops[0], Ops.slice(1),
1040 GEP->getNoWrapFlags(),
1041 GEP->getInRange());
1042 }
1043
1044 if (auto *CE = dyn_cast<ConstantExpr>(InstOrCE))
1045 return CE->getWithOperands(Ops);
1046
1047 switch (Opcode) {
1048 default: return nullptr;
1049 case Instruction::ICmp:
1050 case Instruction::FCmp: {
1051 auto *C = cast<CmpInst>(InstOrCE);
1052 return ConstantFoldCompareInstOperands(C->getPredicate(), Ops[0], Ops[1],
1053 DL, TLI, C);
1054 }
1055 case Instruction::Freeze:
1056 return isGuaranteedNotToBeUndefOrPoison(Ops[0]) ? Ops[0] : nullptr;
1057 case Instruction::Call:
1058 if (auto *F = dyn_cast<Function>(Ops.back())) {
1059 const auto *Call = cast<CallBase>(InstOrCE);
1060 if (canConstantFoldCallTo(Call, F))
1061 return ConstantFoldCall(Call, F, Ops.slice(0, Ops.size() - 1), TLI,
1062 AllowNonDeterministic);
1063 }
1064 return nullptr;
1065 case Instruction::Select:
1066 return ConstantFoldSelectInstruction(Ops[0], Ops[1], Ops[2]);
1067 case Instruction::ExtractElement:
1068 return ConstantExpr::getExtractElement(Ops[0], Ops[1]);
1069 case Instruction::ExtractValue:
1070 return ConstantFoldExtractValueInstruction(
1071 Ops[0], cast<ExtractValueInst>(InstOrCE)->getIndices());
1072 case Instruction::InsertElement:
1073 return ConstantExpr::getInsertElement(Ops[0], Ops[1], Ops[2]);
1074 case Instruction::InsertValue:
1075 return ConstantFoldInsertValueInstruction(
1076 Ops[0], Ops[1], cast<InsertValueInst>(InstOrCE)->getIndices());
1077 case Instruction::ShuffleVector:
1078 return ConstantExpr::getShuffleVector(
1079 Ops[0], Ops[1], cast<ShuffleVectorInst>(InstOrCE)->getShuffleMask());
1080 case Instruction::Load: {
1081 const auto *LI = dyn_cast<LoadInst>(InstOrCE);
1082 if (LI->isVolatile())
1083 return nullptr;
1084 return ConstantFoldLoadFromConstPtr(Ops[0], LI->getType(), DL);
1085 }
1086 }
1087}
1088
1089} // end anonymous namespace
1090
1091//===----------------------------------------------------------------------===//
1092// Constant Folding public APIs
1093//===----------------------------------------------------------------------===//
1094
1095namespace {
1096
1097Constant *
1098ConstantFoldConstantImpl(const Constant *C, const DataLayout &DL,
1099 const TargetLibraryInfo *TLI,
1100 SmallDenseMap<Constant *, Constant *> &FoldedOps) {
1101 if (!isa<ConstantVector>(C) && !isa<ConstantExpr>(C))
1102 return const_cast<Constant *>(C);
1103
1104 SmallVector<Constant *, 8> Ops;
1105 for (const Use &OldU : C->operands()) {
1106 Constant *OldC = cast<Constant>(&OldU);
1107 Constant *NewC = OldC;
1108 // Recursively fold the ConstantExpr's operands. If we have already folded
1109 // a ConstantExpr, we don't have to process it again.
1110 if (isa<ConstantVector>(OldC) || isa<ConstantExpr>(OldC)) {
1111 auto It = FoldedOps.find(OldC);
1112 if (It == FoldedOps.end()) {
1113 NewC = ConstantFoldConstantImpl(OldC, DL, TLI, FoldedOps);
1114 FoldedOps.insert({OldC, NewC});
1115 } else {
1116 NewC = It->second;
1117 }
1118 }
1119 Ops.push_back(NewC);
1120 }
1121
1122 if (auto *CE = dyn_cast<ConstantExpr>(C)) {
1123 if (Constant *Res = ConstantFoldInstOperandsImpl(
1124 CE, CE->getOpcode(), Ops, DL, TLI, /*AllowNonDeterministic=*/true))
1125 return Res;
1126 return const_cast<Constant *>(C);
1127 }
1128
1129 assert(isa<ConstantVector>(C));
1130 return ConstantVector::get(Ops);
1131}
1132
1133} // end anonymous namespace
1134
1135Constant *llvm::ConstantFoldInstruction(Instruction *I,
1136 const DataLayout &DL,
1137 const TargetLibraryInfo *TLI) {
1138 // Handle PHI nodes quickly here...
1139 if (auto *PN = dyn_cast<PHINode>(I)) {
1140 Constant *CommonValue = nullptr;
1141
1142 SmallDenseMap<Constant *, Constant *> FoldedOps;
1143 for (Value *Incoming : PN->incoming_values()) {
1144 // If the incoming value is undef then skip it. Note that while we could
1145 // skip the value if it is equal to the phi node itself we choose not to
1146 // because that would break the rule that constant folding only applies if
1147 // all operands are constants.
1148 if (isa<UndefValue>(Incoming))
1149 continue;
1150 // If the incoming value is not a constant, then give up.
1151 auto *C = dyn_cast<Constant>(Incoming);
1152 if (!C)
1153 return nullptr;
1154 // Fold the PHI's operands.
1155 C = ConstantFoldConstantImpl(C, DL, TLI, FoldedOps);
1156 // If the incoming value is a different constant to
1157 // the one we saw previously, then give up.
1158 if (CommonValue && C != CommonValue)
1159 return nullptr;
1160 CommonValue = C;
1161 }
1162
1163 // If we reach here, all incoming values are the same constant or undef.
1164 return CommonValue ? CommonValue : UndefValue::get(PN->getType());
1165 }
1166
1167 // Scan the operand list, checking to see if they are all constants, if so,
1168 // hand off to ConstantFoldInstOperandsImpl.
1169 if (!all_of(I->operands(), [](const Use &U) { return isa<Constant>(U); }))
1170 return nullptr;
1171
1172 SmallDenseMap<Constant *, Constant *> FoldedOps;
1173 SmallVector<Constant *, 8> Ops;
1174 for (const Use &OpU : I->operands()) {
1175 auto *Op = cast<Constant>(&OpU);
1176 // Fold the Instruction's operands.
1177 Op = ConstantFoldConstantImpl(Op, DL, TLI, FoldedOps);
1178 Ops.push_back(Op);
1179 }
1180
1181 return ConstantFoldInstOperands(I, Ops, DL, TLI);
1182}
1183
1184Constant *llvm::ConstantFoldConstant(const Constant *C, const DataLayout &DL,
1185 const TargetLibraryInfo *TLI) {
1186 SmallDenseMap<Constant *, Constant *> FoldedOps;
1187 return ConstantFoldConstantImpl(C, DL, TLI, FoldedOps);
1188}
1189
1190Constant *llvm::ConstantFoldInstOperands(Instruction *I,
1191 ArrayRef<Constant *> Ops,
1192 const DataLayout &DL,
1193 const TargetLibraryInfo *TLI,
1194 bool AllowNonDeterministic) {
1195 return ConstantFoldInstOperandsImpl(I, I->getOpcode(), Ops, DL, TLI,
1196 AllowNonDeterministic);
1197}
1198
1199Constant *llvm::ConstantFoldCompareInstOperands(
1200 unsigned IntPredicate, Constant *Ops0, Constant *Ops1, const DataLayout &DL,
1201 const TargetLibraryInfo *TLI, const Instruction *I) {
1202 CmpInst::Predicate Predicate = (CmpInst::Predicate)IntPredicate;
1203 // fold: icmp (inttoptr x), null -> icmp x, 0
1204 // fold: icmp null, (inttoptr x) -> icmp 0, x
1205 // fold: icmp (ptrtoint x), 0 -> icmp x, null
1206 // fold: icmp 0, (ptrtoint x) -> icmp null, x
1207 // fold: icmp (inttoptr x), (inttoptr y) -> icmp trunc/zext x, trunc/zext y
1208 // fold: icmp (ptrtoint x), (ptrtoint y) -> icmp x, y
1209 //
1210 // FIXME: The following comment is out of date and the DataLayout is here now.
1211 // ConstantExpr::getCompare cannot do this, because it doesn't have DL
1212 // around to know if bit truncation is happening.
1213 if (auto *CE0 = dyn_cast<ConstantExpr>(Ops0)) {
1214 if (Ops1->isNullValue()) {
1215 if (CE0->getOpcode() == Instruction::IntToPtr) {
1216 Type *IntPtrTy = DL.getIntPtrType(CE0->getType());
1217 // Convert the integer value to the right size to ensure we get the
1218 // proper extension or truncation.
1219 if (Constant *C = ConstantFoldIntegerCast(CE0->getOperand(0), IntPtrTy,
1220 /*IsSigned*/ false, DL)) {
1221 Constant *Null = Constant::getNullValue(C->getType());
1222 return ConstantFoldCompareInstOperands(Predicate, C, Null, DL, TLI);
1223 }
1224 }
1225
1226 // icmp only compares the address part of the pointer, so only do this
1227 // transform if the integer size matches the address size.
1228 if (CE0->getOpcode() == Instruction::PtrToInt ||
1229 CE0->getOpcode() == Instruction::PtrToAddr) {
1230 Type *AddrTy = DL.getAddressType(CE0->getOperand(0)->getType());
1231 if (CE0->getType() == AddrTy) {
1232 Constant *C = CE0->getOperand(0);
1233 Constant *Null = Constant::getNullValue(C->getType());
1234 return ConstantFoldCompareInstOperands(Predicate, C, Null, DL, TLI);
1235 }
1236 }
1237 }
1238
1239 if (auto *CE1 = dyn_cast<ConstantExpr>(Ops1)) {
1240 if (CE0->getOpcode() == CE1->getOpcode()) {
1241 if (CE0->getOpcode() == Instruction::IntToPtr) {
1242 Type *IntPtrTy = DL.getIntPtrType(CE0->getType());
1243
1244 // Convert the integer value to the right size to ensure we get the
1245 // proper extension or truncation.
1246 Constant *C0 = ConstantFoldIntegerCast(CE0->getOperand(0), IntPtrTy,
1247 /*IsSigned*/ false, DL);
1248 Constant *C1 = ConstantFoldIntegerCast(CE1->getOperand(0), IntPtrTy,
1249 /*IsSigned*/ false, DL);
1250 if (C0 && C1)
1251 return ConstantFoldCompareInstOperands(Predicate, C0, C1, DL, TLI);
1252 }
1253
1254 // icmp only compares the address part of the pointer, so only do this
1255 // transform if the integer size matches the address size.
1256 if (CE0->getOpcode() == Instruction::PtrToInt ||
1257 CE0->getOpcode() == Instruction::PtrToAddr) {
1258 Type *AddrTy = DL.getAddressType(CE0->getOperand(0)->getType());
1259 if (CE0->getType() == AddrTy &&
1260 CE0->getOperand(0)->getType() == CE1->getOperand(0)->getType()) {
1261 return ConstantFoldCompareInstOperands(
1262 Predicate, CE0->getOperand(0), CE1->getOperand(0), DL, TLI);
1263 }
1264 }
1265 }
1266 }
1267
1268 // Convert pointer comparison (base+offset1) pred (base+offset2) into
1269 // offset1 pred offset2, for the case where the offset is inbounds. This
1270 // only works for equality and unsigned comparison, as inbounds permits
1271 // crossing the sign boundary. However, the offset comparison itself is
1272 // signed.
1273 if (Ops0->getType()->isPointerTy() && !ICmpInst::isSigned(Predicate)) {
1274 unsigned IndexWidth = DL.getIndexTypeSizeInBits(Ops0->getType());
1275 APInt Offset0(IndexWidth, 0);
1276 bool IsEqPred = ICmpInst::isEquality(Predicate);
1277 Value *Stripped0 = Ops0->stripAndAccumulateConstantOffsets(
1278 DL, Offset0, /*AllowNonInbounds=*/IsEqPred,
1279 /*AllowInvariantGroup=*/false, /*ExternalAnalysis=*/nullptr,
1280 /*LookThroughIntToPtr=*/IsEqPred);
1281 APInt Offset1(IndexWidth, 0);
1282 Value *Stripped1 = Ops1->stripAndAccumulateConstantOffsets(
1283 DL, Offset1, /*AllowNonInbounds=*/IsEqPred,
1284 /*AllowInvariantGroup=*/false, /*ExternalAnalysis=*/nullptr,
1285 /*LookThroughIntToPtr=*/IsEqPred);
1286 if (Stripped0 == Stripped1)
1287 return ConstantInt::getBool(
1288 Ops0->getContext(),
1289 ICmpInst::compare(Offset0, Offset1,
1290 ICmpInst::getSignedPredicate(Predicate)));
1291 }
1292 } else if (isa<ConstantExpr>(Ops1)) {
1293 // If RHS is a constant expression, but the left side isn't, swap the
1294 // operands and try again.
1295 Predicate = ICmpInst::getSwappedPredicate(Predicate);
1296 return ConstantFoldCompareInstOperands(Predicate, Ops1, Ops0, DL, TLI);
1297 }
1298
1299 if (CmpInst::isFPPredicate(Predicate)) {
1300 // Flush any denormal constant float input according to denormal handling
1301 // mode.
1302 Ops0 = FlushFPConstant(Ops0, I, /*IsOutput=*/false);
1303 if (!Ops0)
1304 return nullptr;
1305 Ops1 = FlushFPConstant(Ops1, I, /*IsOutput=*/false);
1306 if (!Ops1)
1307 return nullptr;
1308 }
1309
1310 return ConstantFoldCompareInstruction(Predicate, Ops0, Ops1);
1311}
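// Illustrative example of the offset-based pointer comparison above: for
// @g = global [16 x i8], an unsigned comparison of
//   getelementptr inbounds (i8, ptr @g, i64 4)
// against
//   getelementptr inbounds (i8, ptr @g, i64 8)
// strips both operands down to @g with offsets 4 and 8, so icmp ult folds to
// true.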
1312
1313Constant *llvm::ConstantFoldUnaryOpOperand(unsigned Opcode, Constant *Op,
1314 const DataLayout &DL) {
1315 assert(Instruction::isUnaryOp(Opcode));
1316
1317 return ConstantFoldUnaryInstruction(Opcode, Op);
1318}
1319
1320Constant *llvm::ConstantFoldBinaryOpOperands(unsigned Opcode, Constant *LHS,
1321 Constant *RHS,
1322 const DataLayout &DL) {
1323 assert(Instruction::isBinaryOp(Opcode));
1324 if (isa<ConstantExpr>(LHS) || isa<ConstantExpr>(RHS))
1325 if (Constant *C = SymbolicallyEvaluateBinop(Opcode, LHS, RHS, DL))
1326 return C;
1327
1328 if (ConstantExpr::isDesirableBinOp(Opcode))
1329 return ConstantExpr::get(Opcode, LHS, RHS);
1330 return ConstantFoldBinaryInstruction(Opcode, LHS, RHS);
1331}
1332
1333static ConstantFP *flushDenormalConstant(Type *Ty, const APFloat &APF,
1334 DenormalMode::DenormalModeKind Mode) {
1335 switch (Mode) {
1336 case DenormalMode::Dynamic:
1337 return nullptr;
1338 case DenormalMode::IEEE:
1339 return ConstantFP::get(Ty->getContext(), APF);
1340 case DenormalMode::PreserveSign:
1341 return ConstantFP::get(
1342 Ty->getContext(),
1343 APFloat::getZero(APF.getSemantics(), APF.isNegative()));
1344 case DenormalMode::PositiveZero:
1345 return ConstantFP::get(Ty->getContext(),
1346 APFloat::getZero(APF.getSemantics(), false));
1347 default:
1348 break;
1349 }
1350
1351 llvm_unreachable("unknown denormal mode");
1352}
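// Illustrative example: flushing the single-precision denormal -1.0e-40
// yields -0.0 under DenormalMode::PreserveSign, +0.0 under
// DenormalMode::PositiveZero, the value unchanged under DenormalMode::IEEE,
// and nullptr (no folding) under DenormalMode::Dynamic.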
1353
1354/// Return the denormal mode that can be assumed when executing a floating point
1355/// operation at \p CtxI.
1356static DenormalMode getInstrDenormalMode(const Instruction *CtxI, Type *Ty) {
1357 if (!CtxI || !CtxI->getParent() || !CtxI->getFunction())
1358 return DenormalMode::getDynamic();
1359 return CtxI->getFunction()->getDenormalMode(Ty->getFltSemantics());
1360}
1361
1362static ConstantFP *flushDenormalConstantFP(ConstantFP *CFP,
1363 const Instruction *Inst,
1364 bool IsOutput) {
1365 const APFloat &APF = CFP->getValueAPF();
1366 if (!APF.isDenormal())
1367 return CFP;
1368
1369 DenormalMode Mode = getInstrDenormalMode(Inst, CFP->getType());
1370 return flushDenormalConstant(CFP->getType(), APF,
1371 IsOutput ? Mode.Output : Mode.Input);
1372}
1373
1374Constant *llvm::FlushFPConstant(Constant *Operand, const Instruction *Inst,
1375 bool IsOutput) {
1376 if (ConstantFP *CFP = dyn_cast<ConstantFP>(Operand))
1377 return flushDenormalConstantFP(CFP, Inst, IsOutput);
1378
1379 if (isa<ConstantAggregateZero>(Operand) || isa<UndefValue>(Operand))
1380 return Operand;
1381
1382 Type *Ty = Operand->getType();
1383 VectorType *VecTy = dyn_cast<VectorType>(Ty);
1384 if (VecTy) {
1385 if (auto *Splat = dyn_cast_or_null<ConstantFP>(Operand->getSplatValue())) {
1386 ConstantFP *Folded = flushDenormalConstantFP(Splat, Inst, IsOutput);
1387 if (!Folded)
1388 return nullptr;
1389 return ConstantVector::getSplat(VecTy->getElementCount(), Folded);
1390 }
1391
1392 Ty = VecTy->getElementType();
1393 }
1394
1395 if (isa<ConstantExpr>(Operand))
1396 return Operand;
1397
1398 if (const auto *CV = dyn_cast<ConstantVector>(Operand)) {
1399 SmallVector<Constant *, 16> NewElts;
1400 for (unsigned i = 0, e = CV->getNumOperands(); i != e; ++i) {
1401 Constant *Element = CV->getAggregateElement(i);
1402 if (isa<UndefValue>(Element)) {
1403 NewElts.push_back(Element);
1404 continue;
1405 }
1406
1407 ConstantFP *CFP = dyn_cast<ConstantFP>(Element);
1408 if (!CFP)
1409 return nullptr;
1410
1411 ConstantFP *Folded = flushDenormalConstantFP(CFP, Inst, IsOutput);
1412 if (!Folded)
1413 return nullptr;
1414 NewElts.push_back(Folded);
1415 }
1416
1417 return ConstantVector::get(NewElts);
1418 }
1419
1420 if (const auto *CDV = dyn_cast<ConstantDataVector>(Operand)) {
1421 SmallVector<Constant *, 16> NewElts;
1422 for (unsigned I = 0, E = CDV->getNumElements(); I < E; ++I) {
1423 const APFloat &Elt = CDV->getElementAsAPFloat(I);
1424 if (!Elt.isDenormal()) {
1425 NewElts.push_back(ConstantFP::get(Ty, Elt));
1426 } else {
1427 DenormalMode Mode = getInstrDenormalMode(Inst, Ty);
1428 ConstantFP *Folded =
1429 flushDenormalConstant(Ty, Elt, IsOutput ? Mode.Output : Mode.Input);
1430 if (!Folded)
1431 return nullptr;
1432 NewElts.push_back(Folded);
1433 }
1434 }
1435
1436 return ConstantVector::get(NewElts);
1437 }
1438
1439 return nullptr;
1440}
1441
1442Constant *llvm::ConstantFoldFPInstOperands(unsigned Opcode, Constant *LHS,
1443 Constant *RHS, const DataLayout &DL,
1444 const Instruction *I,
1445 bool AllowNonDeterministic) {
1446 if (Instruction::isBinaryOp(Opcode)) {
1447 // Flush denormal inputs if needed.
1448 Constant *Op0 = FlushFPConstant(LHS, I, /* IsOutput */ false);
1449 if (!Op0)
1450 return nullptr;
1451 Constant *Op1 = FlushFPConstant(RHS, I, /* IsOutput */ false);
1452 if (!Op1)
1453 return nullptr;
1454
1455 // If nsz or an algebraic FMF flag is set, the result of the FP operation
1456 // may change due to future optimization. Don't constant fold them if
1457 // non-deterministic results are not allowed.
1458 if (!AllowNonDeterministic)
1459 if (auto *FP = dyn_cast_or_null<FPMathOperator>(I))
1460 if (FP->hasNoSignedZeros() || FP->hasAllowReassoc() ||
1461 FP->hasAllowContract() || FP->hasAllowReciprocal())
1462 return nullptr;
1463
1464 // Calculate constant result.
1465 Constant *C = ConstantFoldBinaryOpOperands(Opcode, Op0, Op1, DL);
1466 if (!C)
1467 return nullptr;
1468
1469 // Flush denormal output if needed.
1470 C = FlushFPConstant(C, I, /* IsOutput */ true);
1471 if (!C)
1472 return nullptr;
1473
1474 // The precise NaN value is non-deterministic.
1475 if (!AllowNonDeterministic && C->isNaN())
1476 return nullptr;
1477
1478 return C;
1479 }
1480 // If instruction lacks a parent/function and the denormal mode cannot be
1481 // determined, use the default (IEEE).
1482 return ConstantFoldBinaryOpOperands(Opcode, LHS, RHS, DL);
1483}
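// Illustrative example: in a function with "denormal-fp-math"="preserve-sign",
// folding fadd float -1.0e-40, 0.0 first flushes the denormal input to -0.0,
// so the instruction folds to 0.0 rather than to -1.0e-40.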
1484
1485Constant *llvm::ConstantFoldCastOperand(unsigned Opcode, Constant *C,
1486 Type *DestTy, const DataLayout &DL) {
1487 assert(Instruction::isCast(Opcode));
1488
1489 if (auto *CE = dyn_cast<ConstantExpr>(C))
1490 if (CE->isCast())
1491 if (unsigned NewOp = CastInst::isEliminableCastPair(
1492 Instruction::CastOps(CE->getOpcode()),
1493 Instruction::CastOps(Opcode), CE->getOperand(0)->getType(),
1494 C->getType(), DestTy, &DL))
1495 return ConstantFoldCastOperand(NewOp, CE->getOperand(0), DestTy, DL);
1496
1497 switch (Opcode) {
1498 default:
1499 llvm_unreachable("Missing case");
1500 case Instruction::PtrToAddr:
1501 case Instruction::PtrToInt:
1502 if (auto *CE = dyn_cast<ConstantExpr>(C)) {
1503 Constant *FoldedValue = nullptr;
1504 // If the input is an inttoptr, eliminate the pair. This requires knowing
1505 // the width of a pointer, so it can't be done in ConstantExpr::getCast.
1506 if (CE->getOpcode() == Instruction::IntToPtr) {
1507 // zext/trunc the inttoptr to pointer/address size.
1508 Type *MidTy = Opcode == Instruction::PtrToInt
1509 ? DL.getAddressType(CE->getType())
1510 : DL.getIntPtrType(CE->getType());
1511 FoldedValue = ConstantFoldIntegerCast(CE->getOperand(0), MidTy,
1512 /*IsSigned=*/false, DL);
1513 } else if (auto *GEP = dyn_cast<GEPOperator>(CE)) {
1514 // If we have GEP, we can perform the following folds:
1515 // (ptrtoint/ptrtoaddr (gep null, x)) -> x
1516 // (ptrtoint/ptrtoaddr (gep (gep null, x), y) -> x + y, etc.
1517 unsigned BitWidth = DL.getIndexTypeSizeInBits(GEP->getType());
1518 APInt BaseOffset(BitWidth, 0);
1519 auto *Base = cast<Constant>(GEP->stripAndAccumulateConstantOffsets(
1520 DL, BaseOffset, /*AllowNonInbounds=*/true));
1521 if (Base->isNullValue()) {
1522 FoldedValue = ConstantInt::get(CE->getContext(), BaseOffset);
1523 } else {
1524 // ptrtoint/ptrtoaddr (gep i8, Ptr, (sub 0, V))
1525 // -> sub (ptrtoint/ptrtoaddr Ptr), V
1526 if (GEP->getNumIndices() == 1 &&
1527 GEP->getSourceElementType()->isIntegerTy(8)) {
1528 auto *Ptr = cast<Constant>(GEP->getPointerOperand());
1529 auto *Sub = dyn_cast<ConstantExpr>(GEP->getOperand(1));
1530 Type *IntIdxTy = DL.getIndexType(Ptr->getType());
1531 if (Sub && Sub->getType() == IntIdxTy &&
1532 Sub->getOpcode() == Instruction::Sub &&
1533 Sub->getOperand(0)->isNullValue())
1534 FoldedValue = ConstantExpr::getSub(
1535 ConstantExpr::getCast(Opcode, Ptr, IntIdxTy),
1536 Sub->getOperand(1));
1537 }
1538 }
1539 }
1540 if (FoldedValue) {
1541 // Do a zext or trunc to get to the ptrtoint/ptrtoaddr dest size.
1542 return ConstantFoldIntegerCast(FoldedValue, DestTy, /*IsSigned=*/false,
1543 DL);
1544 }
1545 }
1546 break;
1547 case Instruction::IntToPtr:
1548 // If the input is a ptrtoint, turn the pair into a ptr to ptr bitcast if
1549 // the int size is >= the ptr size and the address spaces are the same.
1550 // This requires knowing the width of a pointer, so it can't be done in
1551 // ConstantExpr::getCast.
1552 if (auto *CE = dyn_cast<ConstantExpr>(C)) {
1553 if (CE->getOpcode() == Instruction::PtrToInt) {
1554 Constant *SrcPtr = CE->getOperand(0);
1555 unsigned SrcPtrSize = DL.getPointerTypeSizeInBits(SrcPtr->getType());
1556 unsigned MidIntSize = CE->getType()->getScalarSizeInBits();
1557
1558 if (MidIntSize >= SrcPtrSize) {
1559 unsigned SrcAS = SrcPtr->getType()->getPointerAddressSpace();
1560 if (SrcAS == DestTy->getPointerAddressSpace())
1561 return FoldBitCast(CE->getOperand(0), DestTy, DL);
1562 }
1563 }
1564 }
1565 break;
1566 case Instruction::Trunc:
1567 case Instruction::ZExt:
1568 case Instruction::SExt:
1569 case Instruction::FPTrunc:
1570 case Instruction::FPExt:
1571 case Instruction::UIToFP:
1572 case Instruction::SIToFP:
1573 case Instruction::FPToUI:
1574 case Instruction::FPToSI:
1575 case Instruction::AddrSpaceCast:
1576 break;
1577 case Instruction::BitCast:
1578 return FoldBitCast(C, DestTy, DL);
1579 }
1580
1581 if (ConstantExpr::isDesirableCastOp(Opcode))
1582 return ConstantExpr::getCast(Opcode, C, DestTy);
1583 return ConstantFoldCastInstruction(Opcode, C, DestTy);
1584}
1585
1586Constant *llvm::ConstantFoldIntegerCast(Constant *C, Type *DestTy,
1587 bool IsSigned, const DataLayout &DL) {
1588 Type *SrcTy = C->getType();
1589 if (SrcTy == DestTy)
1590 return C;
1591 if (SrcTy->getScalarSizeInBits() > DestTy->getScalarSizeInBits())
1592 return ConstantFoldCastOperand(Instruction::Trunc, C, DestTy, DL);
1593 if (IsSigned)
1594 return ConstantFoldCastOperand(Instruction::SExt, C, DestTy, DL);
1595 return ConstantFoldCastOperand(Instruction::ZExt, C, DestTy, DL);
1596}
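// Illustrative example: ConstantFoldIntegerCast of i8 -1 (0xFF) to i32 gives
// i32 255 with IsSigned = false (zext) and i32 -1 with IsSigned = true
// (sext); an i64 source wider than the i32 destination always truncates.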
1597
1598//===----------------------------------------------------------------------===//
1599// Constant Folding for Calls
1600//
1601
1602bool llvm::canConstantFoldCallTo(const CallBase *Call, const Function *F) {
1603 if (Call->isNoBuiltin())
1604 return false;
1605 if (Call->getFunctionType() != F->getFunctionType())
1606 return false;
1607
1608 // Allow FP calls (both libcalls and intrinsics) to avoid being folded.
1609 // This can be useful for GPU targets or in cross-compilation scenarios
1610 // when the exact target FP behaviour is required, and the host compiler's
1611 // behaviour may be slightly different from the device's run-time behaviour.
1612 if (DisableFPCallFolding && (F->getReturnType()->isFloatingPointTy() ||
1613 any_of(F->args(), [](const Argument &Arg) {
1614 return Arg.getType()->isFloatingPointTy();
1615 })))
1616 return false;
1617
1618 switch (F->getIntrinsicID()) {
1619 // Operations that do not operate on floating-point numbers and do not depend
1620 // on the FP environment can be folded even in strictfp functions.
1621 case Intrinsic::bswap:
1622 case Intrinsic::ctpop:
1623 case Intrinsic::ctlz:
1624 case Intrinsic::cttz:
1625 case Intrinsic::fshl:
1626 case Intrinsic::fshr:
1627 case Intrinsic::launder_invariant_group:
1628 case Intrinsic::strip_invariant_group:
1629 case Intrinsic::masked_load:
1630 case Intrinsic::get_active_lane_mask:
1631 case Intrinsic::abs:
1632 case Intrinsic::smax:
1633 case Intrinsic::smin:
1634 case Intrinsic::umax:
1635 case Intrinsic::umin:
1636 case Intrinsic::scmp:
1637 case Intrinsic::ucmp:
1638 case Intrinsic::sadd_with_overflow:
1639 case Intrinsic::uadd_with_overflow:
1640 case Intrinsic::ssub_with_overflow:
1641 case Intrinsic::usub_with_overflow:
1642 case Intrinsic::smul_with_overflow:
1643 case Intrinsic::umul_with_overflow:
1644 case Intrinsic::sadd_sat:
1645 case Intrinsic::uadd_sat:
1646 case Intrinsic::ssub_sat:
1647 case Intrinsic::usub_sat:
1648 case Intrinsic::smul_fix:
1649 case Intrinsic::smul_fix_sat:
1650 case Intrinsic::bitreverse:
1651 case Intrinsic::is_constant:
1652 case Intrinsic::vector_reduce_add:
1653 case Intrinsic::vector_reduce_mul:
1654 case Intrinsic::vector_reduce_and:
1655 case Intrinsic::vector_reduce_or:
1656 case Intrinsic::vector_reduce_xor:
1657 case Intrinsic::vector_reduce_smin:
1658 case Intrinsic::vector_reduce_smax:
1659 case Intrinsic::vector_reduce_umin:
1660 case Intrinsic::vector_reduce_umax:
1661 case Intrinsic::vector_extract:
1662 case Intrinsic::vector_insert:
1663 case Intrinsic::vector_interleave2:
1664 case Intrinsic::vector_interleave3:
1665 case Intrinsic::vector_interleave4:
1666 case Intrinsic::vector_interleave5:
1667 case Intrinsic::vector_interleave6:
1668 case Intrinsic::vector_interleave7:
1669 case Intrinsic::vector_interleave8:
1670 case Intrinsic::vector_deinterleave2:
1671 case Intrinsic::vector_deinterleave3:
1672 case Intrinsic::vector_deinterleave4:
1673 case Intrinsic::vector_deinterleave5:
1674 case Intrinsic::vector_deinterleave6:
1675 case Intrinsic::vector_deinterleave7:
1676 case Intrinsic::vector_deinterleave8:
1677 // Target intrinsics
1678 case Intrinsic::amdgcn_perm:
1679 case Intrinsic::amdgcn_wave_reduce_umin:
1680 case Intrinsic::amdgcn_wave_reduce_umax:
1681 case Intrinsic::amdgcn_wave_reduce_max:
1682 case Intrinsic::amdgcn_wave_reduce_min:
1683 case Intrinsic::amdgcn_wave_reduce_add:
1684 case Intrinsic::amdgcn_wave_reduce_sub:
1685 case Intrinsic::amdgcn_wave_reduce_and:
1686 case Intrinsic::amdgcn_wave_reduce_or:
1687 case Intrinsic::amdgcn_wave_reduce_xor:
1688 case Intrinsic::amdgcn_s_wqm:
1689 case Intrinsic::amdgcn_s_quadmask:
1690 case Intrinsic::amdgcn_s_bitreplicate:
1691 case Intrinsic::arm_mve_vctp8:
1692 case Intrinsic::arm_mve_vctp16:
1693 case Intrinsic::arm_mve_vctp32:
1694 case Intrinsic::arm_mve_vctp64:
1695 case Intrinsic::aarch64_sve_convert_from_svbool:
1696 case Intrinsic::wasm_alltrue:
1697 case Intrinsic::wasm_anytrue:
1698 case Intrinsic::wasm_dot:
1699 // WebAssembly float semantics are always known
1700 case Intrinsic::wasm_trunc_signed:
1701 case Intrinsic::wasm_trunc_unsigned:
1702 return true;
1703
1704 // Floating point operations cannot be folded in strictfp functions in the
1705 // general case. They can be folded if the FP environment is known to the compiler.
1706 case Intrinsic::minnum:
1707 case Intrinsic::maxnum:
1708 case Intrinsic::minimum:
1709 case Intrinsic::maximum:
1710 case Intrinsic::minimumnum:
1711 case Intrinsic::maximumnum:
1712 case Intrinsic::log:
1713 case Intrinsic::log2:
1714 case Intrinsic::log10:
1715 case Intrinsic::exp:
1716 case Intrinsic::exp2:
1717 case Intrinsic::exp10:
1718 case Intrinsic::sqrt:
1719 case Intrinsic::sin:
1720 case Intrinsic::cos:
1721 case Intrinsic::sincos:
1722 case Intrinsic::sinh:
1723 case Intrinsic::cosh:
1724 case Intrinsic::atan:
1725 case Intrinsic::pow:
1726 case Intrinsic::powi:
1727 case Intrinsic::ldexp:
1728 case Intrinsic::fma:
1729 case Intrinsic::fmuladd:
1730 case Intrinsic::frexp:
1731 case Intrinsic::fptoui_sat:
1732 case Intrinsic::fptosi_sat:
1733 case Intrinsic::convert_from_fp16:
1734 case Intrinsic::convert_to_fp16:
1735 case Intrinsic::amdgcn_cos:
1736 case Intrinsic::amdgcn_cubeid:
1737 case Intrinsic::amdgcn_cubema:
1738 case Intrinsic::amdgcn_cubesc:
1739 case Intrinsic::amdgcn_cubetc:
1740 case Intrinsic::amdgcn_fmul_legacy:
1741 case Intrinsic::amdgcn_fma_legacy:
1742 case Intrinsic::amdgcn_fract:
1743 case Intrinsic::amdgcn_sin:
1744 // The intrinsics below depend on rounding mode in MXCSR.
1745 case Intrinsic::x86_sse_cvtss2si:
1746 case Intrinsic::x86_sse_cvtss2si64:
1747 case Intrinsic::x86_sse_cvttss2si:
1748 case Intrinsic::x86_sse_cvttss2si64:
1749 case Intrinsic::x86_sse2_cvtsd2si:
1750 case Intrinsic::x86_sse2_cvtsd2si64:
1751 case Intrinsic::x86_sse2_cvttsd2si:
1752 case Intrinsic::x86_sse2_cvttsd2si64:
1753 case Intrinsic::x86_avx512_vcvtss2si32:
1754 case Intrinsic::x86_avx512_vcvtss2si64:
1755 case Intrinsic::x86_avx512_cvttss2si:
1756 case Intrinsic::x86_avx512_cvttss2si64:
1757 case Intrinsic::x86_avx512_vcvtsd2si32:
1758 case Intrinsic::x86_avx512_vcvtsd2si64:
1759 case Intrinsic::x86_avx512_cvttsd2si:
1760 case Intrinsic::x86_avx512_cvttsd2si64:
1761 case Intrinsic::x86_avx512_vcvtss2usi32:
1762 case Intrinsic::x86_avx512_vcvtss2usi64:
1763 case Intrinsic::x86_avx512_cvttss2usi:
1764 case Intrinsic::x86_avx512_cvttss2usi64:
1765 case Intrinsic::x86_avx512_vcvtsd2usi32:
1766 case Intrinsic::x86_avx512_vcvtsd2usi64:
1767 case Intrinsic::x86_avx512_cvttsd2usi:
1768 case Intrinsic::x86_avx512_cvttsd2usi64:
1769
1770 // NVVM FMax intrinsics
1771 case Intrinsic::nvvm_fmax_d:
1772 case Intrinsic::nvvm_fmax_f:
1773 case Intrinsic::nvvm_fmax_ftz_f:
1774 case Intrinsic::nvvm_fmax_ftz_nan_f:
1775 case Intrinsic::nvvm_fmax_ftz_nan_xorsign_abs_f:
1776 case Intrinsic::nvvm_fmax_ftz_xorsign_abs_f:
1777 case Intrinsic::nvvm_fmax_nan_f:
1778 case Intrinsic::nvvm_fmax_nan_xorsign_abs_f:
1779 case Intrinsic::nvvm_fmax_xorsign_abs_f:
1780
1781 // NVVM FMin intrinsics
1782 case Intrinsic::nvvm_fmin_d:
1783 case Intrinsic::nvvm_fmin_f:
1784 case Intrinsic::nvvm_fmin_ftz_f:
1785 case Intrinsic::nvvm_fmin_ftz_nan_f:
1786 case Intrinsic::nvvm_fmin_ftz_nan_xorsign_abs_f:
1787 case Intrinsic::nvvm_fmin_ftz_xorsign_abs_f:
1788 case Intrinsic::nvvm_fmin_nan_f:
1789 case Intrinsic::nvvm_fmin_nan_xorsign_abs_f:
1790 case Intrinsic::nvvm_fmin_xorsign_abs_f:
1791
1792 // NVVM float/double to int32/uint32 conversion intrinsics
1793 case Intrinsic::nvvm_f2i_rm:
1794 case Intrinsic::nvvm_f2i_rn:
1795 case Intrinsic::nvvm_f2i_rp:
1796 case Intrinsic::nvvm_f2i_rz:
1797 case Intrinsic::nvvm_f2i_rm_ftz:
1798 case Intrinsic::nvvm_f2i_rn_ftz:
1799 case Intrinsic::nvvm_f2i_rp_ftz:
1800 case Intrinsic::nvvm_f2i_rz_ftz:
1801 case Intrinsic::nvvm_f2ui_rm:
1802 case Intrinsic::nvvm_f2ui_rn:
1803 case Intrinsic::nvvm_f2ui_rp:
1804 case Intrinsic::nvvm_f2ui_rz:
1805 case Intrinsic::nvvm_f2ui_rm_ftz:
1806 case Intrinsic::nvvm_f2ui_rn_ftz:
1807 case Intrinsic::nvvm_f2ui_rp_ftz:
1808 case Intrinsic::nvvm_f2ui_rz_ftz:
1809 case Intrinsic::nvvm_d2i_rm:
1810 case Intrinsic::nvvm_d2i_rn:
1811 case Intrinsic::nvvm_d2i_rp:
1812 case Intrinsic::nvvm_d2i_rz:
1813 case Intrinsic::nvvm_d2ui_rm:
1814 case Intrinsic::nvvm_d2ui_rn:
1815 case Intrinsic::nvvm_d2ui_rp:
1816 case Intrinsic::nvvm_d2ui_rz:
1817
1818 // NVVM float/double to int64/uint64 conversion intrinsics
1819 case Intrinsic::nvvm_f2ll_rm:
1820 case Intrinsic::nvvm_f2ll_rn:
1821 case Intrinsic::nvvm_f2ll_rp:
1822 case Intrinsic::nvvm_f2ll_rz:
1823 case Intrinsic::nvvm_f2ll_rm_ftz:
1824 case Intrinsic::nvvm_f2ll_rn_ftz:
1825 case Intrinsic::nvvm_f2ll_rp_ftz:
1826 case Intrinsic::nvvm_f2ll_rz_ftz:
1827 case Intrinsic::nvvm_f2ull_rm:
1828 case Intrinsic::nvvm_f2ull_rn:
1829 case Intrinsic::nvvm_f2ull_rp:
1830 case Intrinsic::nvvm_f2ull_rz:
1831 case Intrinsic::nvvm_f2ull_rm_ftz:
1832 case Intrinsic::nvvm_f2ull_rn_ftz:
1833 case Intrinsic::nvvm_f2ull_rp_ftz:
1834 case Intrinsic::nvvm_f2ull_rz_ftz:
1835 case Intrinsic::nvvm_d2ll_rm:
1836 case Intrinsic::nvvm_d2ll_rn:
1837 case Intrinsic::nvvm_d2ll_rp:
1838 case Intrinsic::nvvm_d2ll_rz:
1839 case Intrinsic::nvvm_d2ull_rm:
1840 case Intrinsic::nvvm_d2ull_rn:
1841 case Intrinsic::nvvm_d2ull_rp:
1842 case Intrinsic::nvvm_d2ull_rz:
1843
1844 // NVVM math intrinsics:
1845 case Intrinsic::nvvm_ceil_d:
1846 case Intrinsic::nvvm_ceil_f:
1847 case Intrinsic::nvvm_ceil_ftz_f:
1848
1849 case Intrinsic::nvvm_fabs:
1850 case Intrinsic::nvvm_fabs_ftz:
1851
1852 case Intrinsic::nvvm_floor_d:
1853 case Intrinsic::nvvm_floor_f:
1854 case Intrinsic::nvvm_floor_ftz_f:
1855
1856 case Intrinsic::nvvm_rcp_rm_d:
1857 case Intrinsic::nvvm_rcp_rm_f:
1858 case Intrinsic::nvvm_rcp_rm_ftz_f:
1859 case Intrinsic::nvvm_rcp_rn_d:
1860 case Intrinsic::nvvm_rcp_rn_f:
1861 case Intrinsic::nvvm_rcp_rn_ftz_f:
1862 case Intrinsic::nvvm_rcp_rp_d:
1863 case Intrinsic::nvvm_rcp_rp_f:
1864 case Intrinsic::nvvm_rcp_rp_ftz_f:
1865 case Intrinsic::nvvm_rcp_rz_d:
1866 case Intrinsic::nvvm_rcp_rz_f:
1867 case Intrinsic::nvvm_rcp_rz_ftz_f:
1868
1869 case Intrinsic::nvvm_round_d:
1870 case Intrinsic::nvvm_round_f:
1871 case Intrinsic::nvvm_round_ftz_f:
1872
1873 case Intrinsic::nvvm_saturate_d:
1874 case Intrinsic::nvvm_saturate_f:
1875 case Intrinsic::nvvm_saturate_ftz_f:
1876
1877 case Intrinsic::nvvm_sqrt_f:
1878 case Intrinsic::nvvm_sqrt_rn_d:
1879 case Intrinsic::nvvm_sqrt_rn_f:
1880 case Intrinsic::nvvm_sqrt_rn_ftz_f:
1881 return !Call->isStrictFP();
1882
1883 // NVVM add intrinsics with explicit rounding modes
1884 case Intrinsic::nvvm_add_rm_d:
1885 case Intrinsic::nvvm_add_rn_d:
1886 case Intrinsic::nvvm_add_rp_d:
1887 case Intrinsic::nvvm_add_rz_d:
1888 case Intrinsic::nvvm_add_rm_f:
1889 case Intrinsic::nvvm_add_rn_f:
1890 case Intrinsic::nvvm_add_rp_f:
1891 case Intrinsic::nvvm_add_rz_f:
1892 case Intrinsic::nvvm_add_rm_ftz_f:
1893 case Intrinsic::nvvm_add_rn_ftz_f:
1894 case Intrinsic::nvvm_add_rp_ftz_f:
1895 case Intrinsic::nvvm_add_rz_ftz_f:
1896
1897 // NVVM div intrinsics with explicit rounding modes
1898 case Intrinsic::nvvm_div_rm_d:
1899 case Intrinsic::nvvm_div_rn_d:
1900 case Intrinsic::nvvm_div_rp_d:
1901 case Intrinsic::nvvm_div_rz_d:
1902 case Intrinsic::nvvm_div_rm_f:
1903 case Intrinsic::nvvm_div_rn_f:
1904 case Intrinsic::nvvm_div_rp_f:
1905 case Intrinsic::nvvm_div_rz_f:
1906 case Intrinsic::nvvm_div_rm_ftz_f:
1907 case Intrinsic::nvvm_div_rn_ftz_f:
1908 case Intrinsic::nvvm_div_rp_ftz_f:
1909 case Intrinsic::nvvm_div_rz_ftz_f:
1910
1911 // NVVM mul intrinsics with explicit rounding modes
1912 case Intrinsic::nvvm_mul_rm_d:
1913 case Intrinsic::nvvm_mul_rn_d:
1914 case Intrinsic::nvvm_mul_rp_d:
1915 case Intrinsic::nvvm_mul_rz_d:
1916 case Intrinsic::nvvm_mul_rm_f:
1917 case Intrinsic::nvvm_mul_rn_f:
1918 case Intrinsic::nvvm_mul_rp_f:
1919 case Intrinsic::nvvm_mul_rz_f:
1920 case Intrinsic::nvvm_mul_rm_ftz_f:
1921 case Intrinsic::nvvm_mul_rn_ftz_f:
1922 case Intrinsic::nvvm_mul_rp_ftz_f:
1923 case Intrinsic::nvvm_mul_rz_ftz_f:
1924
1925 // NVVM fma intrinsics with explicit rounding modes
1926 case Intrinsic::nvvm_fma_rm_d:
1927 case Intrinsic::nvvm_fma_rn_d:
1928 case Intrinsic::nvvm_fma_rp_d:
1929 case Intrinsic::nvvm_fma_rz_d:
1930 case Intrinsic::nvvm_fma_rm_f:
1931 case Intrinsic::nvvm_fma_rn_f:
1932 case Intrinsic::nvvm_fma_rp_f:
1933 case Intrinsic::nvvm_fma_rz_f:
1934 case Intrinsic::nvvm_fma_rm_ftz_f:
1935 case Intrinsic::nvvm_fma_rn_ftz_f:
1936 case Intrinsic::nvvm_fma_rp_ftz_f:
1937 case Intrinsic::nvvm_fma_rz_ftz_f:
1938
1939 // Sign operations are actually bitwise operations, they do not raise
1940 // exceptions even for SNANs.
1941 case Intrinsic::fabs:
1942 case Intrinsic::copysign:
1943 case Intrinsic::is_fpclass:
1944 // Non-constrained variants of rounding operations means default FP
1945 // environment, they can be folded in any case.
1946 case Intrinsic::ceil:
1947 case Intrinsic::floor:
1948 case Intrinsic::round:
1949 case Intrinsic::roundeven:
1950 case Intrinsic::trunc:
1951 case Intrinsic::nearbyint:
1952 case Intrinsic::rint:
1953 case Intrinsic::canonicalize:
1954
1955 // Constrained intrinsics can be folded if FP environment is known
1956 // to compiler.
1957 case Intrinsic::experimental_constrained_fma:
1958 case Intrinsic::experimental_constrained_fmuladd:
1959 case Intrinsic::experimental_constrained_fadd:
1960 case Intrinsic::experimental_constrained_fsub:
1961 case Intrinsic::experimental_constrained_fmul:
1962 case Intrinsic::experimental_constrained_fdiv:
1963 case Intrinsic::experimental_constrained_frem:
1964 case Intrinsic::experimental_constrained_ceil:
1965 case Intrinsic::experimental_constrained_floor:
1966 case Intrinsic::experimental_constrained_round:
1967 case Intrinsic::experimental_constrained_roundeven:
1968 case Intrinsic::experimental_constrained_trunc:
1969 case Intrinsic::experimental_constrained_nearbyint:
1970 case Intrinsic::experimental_constrained_rint:
1971 case Intrinsic::experimental_constrained_fcmp:
1972 case Intrinsic::experimental_constrained_fcmps:
1973 return true;
1974 default:
1975 return false;
1976 case Intrinsic::not_intrinsic: break;
1977 }
1978
1979 if (!F->hasName() || Call->isStrictFP())
1980 return false;
1981
1982 // In these cases, checking the length is required. We don't want to return
1983 // true for a name like "cos\0blah", which strcmp would consider equal to
1984 // "cos" but which has length 8.
1985 StringRef Name = F->getName();
1986 switch (Name[0]) {
1987 default:
1988 return false;
1989 // clang-format off
1990 case 'a':
1991 return Name == "acos" || Name == "acosf" ||
1992 Name == "asin" || Name == "asinf" ||
1993 Name == "atan" || Name == "atanf" ||
1994 Name == "atan2" || Name == "atan2f";
1995 case 'c':
1996 return Name == "ceil" || Name == "ceilf" ||
1997 Name == "cos" || Name == "cosf" ||
1998 Name == "cosh" || Name == "coshf";
1999 case 'e':
2000 return Name == "exp" || Name == "expf" || Name == "exp2" ||
2001 Name == "exp2f" || Name == "erf" || Name == "erff";
2002 case 'f':
2003 return Name == "fabs" || Name == "fabsf" ||
2004 Name == "floor" || Name == "floorf" ||
2005 Name == "fmod" || Name == "fmodf";
2006 case 'i':
2007 return Name == "ilogb" || Name == "ilogbf";
2008 case 'l':
2009 return Name == "log" || Name == "logf" || Name == "logl" ||
2010 Name == "log2" || Name == "log2f" || Name == "log10" ||
2011 Name == "log10f" || Name == "logb" || Name == "logbf" ||
2012 Name == "log1p" || Name == "log1pf";
2013 case 'n':
2014 return Name == "nearbyint" || Name == "nearbyintf";
2015 case 'p':
2016 return Name == "pow" || Name == "powf";
2017 case 'r':
2018 return Name == "remainder" || Name == "remainderf" ||
2019 Name == "rint" || Name == "rintf" ||
2020 Name == "round" || Name == "roundf" ||
2021 Name == "roundeven" || Name == "roundevenf";
2022 case 's':
2023 return Name == "sin" || Name == "sinf" ||
2024 Name == "sinh" || Name == "sinhf" ||
2025 Name == "sqrt" || Name == "sqrtf";
2026 case 't':
2027 return Name == "tan" || Name == "tanf" ||
2028 Name == "tanh" || Name == "tanhf" ||
2029 Name == "trunc" || Name == "truncf";
2030 case '_':
2031 // Check for various function names that get used for the math functions
2032 // when the header files are preprocessed with the macro
2033 // __FINITE_MATH_ONLY__ enabled.
2034 // The '12' here is the length of the shortest name that can match.
2035 // We need to check the size before looking at Name[1] and Name[2]
2036 // so we may as well check a limit that will eliminate mismatches.
2037 if (Name.size() < 12 || Name[1] != '_')
2038 return false;
2039 switch (Name[2]) {
2040 default:
2041 return false;
2042 case 'a':
2043 return Name == "__acos_finite" || Name == "__acosf_finite" ||
2044 Name == "__asin_finite" || Name == "__asinf_finite" ||
2045 Name == "__atan2_finite" || Name == "__atan2f_finite";
2046 case 'c':
2047 return Name == "__cosh_finite" || Name == "__coshf_finite";
2048 case 'e':
2049 return Name == "__exp_finite" || Name == "__expf_finite" ||
2050 Name == "__exp2_finite" || Name == "__exp2f_finite";
2051 case 'l':
2052 return Name == "__log_finite" || Name == "__logf_finite" ||
2053 Name == "__log10_finite" || Name == "__log10f_finite";
2054 case 'p':
2055 return Name == "__pow_finite" || Name == "__powf_finite";
2056 case 's':
2057 return Name == "__sinh_finite" || Name == "__sinhf_finite";
2058 }
2059 // clang-format on
2060 }
2061}
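// Illustrative note (not part of the upstream source): the switch on Name
// above only admits known libm-style names, so e.g. a call to @sinf is a
// folding candidate while @sinl or a user function named "sine" is not. The
// length remark exists because StringRef equality, unlike strcmp, also
// compares lengths, so "cos\0blah" is correctly rejected.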
2062
2063namespace {
2064
2065Constant *GetConstantFoldFPValue(double V, Type *Ty) {
2066 if (Ty->isHalfTy() || Ty->isFloatTy()) {
2067 APFloat APF(V);
2068 bool unused;
2069 APF.convert(Ty->getFltSemantics(), APFloat::rmNearestTiesToEven, &unused);
2070 return ConstantFP::get(Ty->getContext(), APF);
2071 }
2072 if (Ty->isDoubleTy())
2073 return ConstantFP::get(Ty->getContext(), APFloat(V));
2074 llvm_unreachable("Can only constant fold half/float/double");
2075}
2076
2077#if defined(HAS_IEE754_FLOAT128) && defined(HAS_LOGF128)
2078Constant *GetConstantFoldFPValue128(float128 V, Type *Ty) {
2079 if (Ty->isFP128Ty())
2080 return ConstantFP::get(Ty, V);
2081 llvm_unreachable("Can only constant fold fp128");
2082}
2083#endif
2084
2085/// Clear the floating-point exception state.
2086inline void llvm_fenv_clearexcept() {
2087#if HAVE_DECL_FE_ALL_EXCEPT
2088 feclearexcept(FE_ALL_EXCEPT);
2089#endif
2090 errno = 0;
2091}
2092
2093/// Test if a floating-point exception was raised.
2094inline bool llvm_fenv_testexcept() {
2095 int errno_val = errno;
2096 if (errno_val == ERANGE || errno_val == EDOM)
2097 return true;
2098#if HAVE_DECL_FE_ALL_EXCEPT && HAVE_DECL_FE_INEXACT
2099 if (fetestexcept(FE_ALL_EXCEPT & ~FE_INEXACT))
2100 return true;
2101#endif
2102 return false;
2103}
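// Illustrative note (not part of the upstream source): these two helpers
// bracket host libm calls, roughly
//   llvm_fenv_clearexcept();
//   double R = log(X);               // evaluate on the host
//   if (llvm_fenv_testexcept()) ...  // refuse to fold if errno/FP flags fired
// so a call that sets EDOM/ERANGE or raises a non-inexact FP exception is
// left for the target to evaluate at run time.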
2104
2105static APFloat FTZPreserveSign(const APFloat &V) {
2106 if (V.isDenormal())
2107 return APFloat::getZero(V.getSemantics(), V.isNegative());
2108 return V;
2109}
2110
2111static APFloat FlushToPositiveZero(const APFloat &V) {
2112 if (V.isDenormal())
2113 return APFloat::getZero(V.getSemantics(), false);
2114 return V;
2115}
2116
2117static APFloat FlushWithDenormKind(const APFloat &V,
2118 DenormalMode::DenormalModeKind DenormKind) {
2121 switch (DenormKind) {
2122 case DenormalMode::DenormalModeKind::IEEE:
2123 return V;
2124 case DenormalMode::DenormalModeKind::PreserveSign:
2125 return FTZPreserveSign(V);
2126 case DenormalMode::DenormalModeKind::PositiveZero:
2127 return FlushToPositiveZero(V);
2128 default:
2129 llvm_unreachable("Invalid denormal mode!");
2130 }
2131}
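// Illustrative note (not part of the upstream source): for IEEE single
// precision, 1.0e-45f is denormal, so under PreserveSign -1.0e-45f flushes to
// -0.0f while under PositiveZero it flushes to +0.0f; a normal value such as
// 1.0f passes through unchanged in every mode.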
2132
2133Constant *ConstantFoldFP(double (*NativeFP)(double), const APFloat &V, Type *Ty,
2134 DenormalMode DenormMode = DenormalMode::getIEEE()) {
2135 if (!DenormMode.isValid() ||
2136 DenormMode.Input == DenormalMode::DenormalModeKind::Dynamic ||
2137 DenormMode.Output == DenormalMode::DenormalModeKind::Dynamic)
2138 return nullptr;
2139
2140 llvm_fenv_clearexcept();
2141 auto Input = FlushWithDenormKind(V, DenormMode.Input);
2142 double Result = NativeFP(Input.convertToDouble());
2143 if (llvm_fenv_testexcept()) {
2144 llvm_fenv_clearexcept();
2145 return nullptr;
2146 }
2147
2148 Constant *Output = GetConstantFoldFPValue(Result, Ty);
2149 if (DenormMode.Output == DenormalMode::DenormalModeKind::IEEE)
2150 return Output;
2151 const auto *CFP = static_cast<ConstantFP *>(Output);
2152 const auto Res = FlushWithDenormKind(CFP->getValueAPF(), DenormMode.Output);
2153 return ConstantFP::get(Ty->getContext(), Res);
2154}
2155
2156#if defined(HAS_IEE754_FLOAT128) && defined(HAS_LOGF128)
2157Constant *ConstantFoldFP128(float128 (*NativeFP)(float128), const APFloat &V,
2158 Type *Ty) {
2159 llvm_fenv_clearexcept();
2160 float128 Result = NativeFP(V.convertToQuad());
2161 if (llvm_fenv_testexcept()) {
2162 llvm_fenv_clearexcept();
2163 return nullptr;
2164 }
2165
2166 return GetConstantFoldFPValue128(Result, Ty);
2167}
2168#endif
2169
2170Constant *ConstantFoldBinaryFP(double (*NativeFP)(double, double),
2171 const APFloat &V, const APFloat &W, Type *Ty) {
2172 llvm_fenv_clearexcept();
2173 double Result = NativeFP(V.convertToDouble(), W.convertToDouble());
2174 if (llvm_fenv_testexcept()) {
2175 llvm_fenv_clearexcept();
2176 return nullptr;
2177 }
2178
2179 return GetConstantFoldFPValue(Result, Ty);
2180}
2181
2182Constant *constantFoldVectorReduce(Intrinsic::ID IID, Constant *Op) {
2183 auto *OpVT = cast<VectorType>(Op->getType());
2184
2185 // This is the same as the underlying binops - poison propagates.
2186 if (Op->containsPoisonElement())
2187 return PoisonValue::get(OpVT->getElementType());
2188
2189 // Shortcut non-accumulating reductions.
2190 if (Constant *SplatVal = Op->getSplatValue()) {
2191 switch (IID) {
2192 case Intrinsic::vector_reduce_and:
2193 case Intrinsic::vector_reduce_or:
2194 case Intrinsic::vector_reduce_smin:
2195 case Intrinsic::vector_reduce_smax:
2196 case Intrinsic::vector_reduce_umin:
2197 case Intrinsic::vector_reduce_umax:
2198 return SplatVal;
2199 case Intrinsic::vector_reduce_add:
2200 if (SplatVal->isNullValue())
2201 return SplatVal;
2202 break;
2203 case Intrinsic::vector_reduce_mul:
2204 if (SplatVal->isNullValue() || SplatVal->isOneValue())
2205 return SplatVal;
2206 break;
2207 case Intrinsic::vector_reduce_xor:
2208 if (SplatVal->isNullValue())
2209 return SplatVal;
2210 if (OpVT->getElementCount().isKnownMultipleOf(2))
2211 return Constant::getNullValue(OpVT->getElementType());
2212 break;
2213 }
2214 }
2215
2216 auto *VT = dyn_cast<FixedVectorType>(OpVT);
2217 if (!VT)
2218 return nullptr;
2219
2220 // TODO: Handle undef.
2221 auto *EltC = dyn_cast_or_null<ConstantInt>(Op->getAggregateElement(0U));
2222 if (!EltC)
2223 return nullptr;
2224
2225 APInt Acc = EltC->getValue();
2226 for (unsigned I = 1, E = VT->getNumElements(); I != E; I++) {
2227 if (!(EltC = dyn_cast_or_null<ConstantInt>(Op->getAggregateElement(I))))
2228 return nullptr;
2229 const APInt &X = EltC->getValue();
2230 switch (IID) {
2231 case Intrinsic::vector_reduce_add:
2232 Acc = Acc + X;
2233 break;
2234 case Intrinsic::vector_reduce_mul:
2235 Acc = Acc * X;
2236 break;
2237 case Intrinsic::vector_reduce_and:
2238 Acc = Acc & X;
2239 break;
2240 case Intrinsic::vector_reduce_or:
2241 Acc = Acc | X;
2242 break;
2243 case Intrinsic::vector_reduce_xor:
2244 Acc = Acc ^ X;
2245 break;
2246 case Intrinsic::vector_reduce_smin:
2247 Acc = APIntOps::smin(Acc, X);
2248 break;
2249 case Intrinsic::vector_reduce_smax:
2250 Acc = APIntOps::smax(Acc, X);
2251 break;
2252 case Intrinsic::vector_reduce_umin:
2253 Acc = APIntOps::umin(Acc, X);
2254 break;
2255 case Intrinsic::vector_reduce_umax:
2256 Acc = APIntOps::umax(Acc, X);
2257 break;
2258 }
2259 }
2260
2261 return ConstantInt::get(Op->getContext(), Acc);
2262}
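// Illustrative note (not part of the upstream source): e.g.
//   llvm.vector.reduce.add.v4i32(<4 x i32> <i32 1, i32 2, i32 3, i32 4>)
// folds to i32 10, and a reduce_xor over a splat with an even element count
// folds to 0 because equal lanes cancel pairwise (x ^ x == 0).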
2263
2264/// Attempt to fold an SSE floating point to integer conversion of a constant
2265/// floating point. If roundTowardZero is false, the default IEEE rounding is
2266/// used (toward nearest, ties to even). This matches the behavior of the
2267/// non-truncating SSE instructions in the default rounding mode. The desired
2268/// integer type Ty is used to select how many bits are available for the
2269/// result. Returns null if the conversion cannot be performed, otherwise
2270/// returns the Constant value resulting from the conversion.
2271Constant *ConstantFoldSSEConvertToInt(const APFloat &Val, bool roundTowardZero,
2272 Type *Ty, bool IsSigned) {
2273 // All of these conversion intrinsics form an integer of at most 64 bits.
2274 unsigned ResultWidth = Ty->getIntegerBitWidth();
2275 assert(ResultWidth <= 64 &&
2276 "Can only constant fold conversions to 64 and 32 bit ints");
2277
2278 uint64_t UIntVal;
2279 bool isExact = false;
2280 APFloat::roundingMode mode = roundTowardZero ? APFloat::rmTowardZero
2281 : APFloat::rmNearestTiesToEven;
2282 APFloat::opStatus status =
2283 Val.convertToInteger(MutableArrayRef(UIntVal), ResultWidth,
2284 IsSigned, mode, &isExact);
2285 if (status != APFloat::opOK &&
2286 (!roundTowardZero || status != APFloat::opInexact))
2287 return nullptr;
2288 return ConstantInt::get(Ty, UIntVal, IsSigned);
2289}
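// Illustrative note (not part of the upstream source): with the default
// nearest-ties-to-even mode, cvtss2si(2.5f) folds to 2 and cvtss2si(3.5f) to
// 4, whereas the truncating forms (roundTowardZero == true) fold them to 2
// and 3. NaN or out-of-range inputs produce a non-OK status and return
// nullptr, so the instruction keeps its target-defined behaviour.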
2290
2291double getValueAsDouble(ConstantFP *Op) {
2292 Type *Ty = Op->getType();
2293
2294 if (Ty->isBFloatTy() || Ty->isHalfTy() || Ty->isFloatTy() || Ty->isDoubleTy())
2295 return Op->getValueAPF().convertToDouble();
2296
2297 bool unused;
2298 APFloat APF = Op->getValueAPF();
2299 APF.convert(APFloat::IEEEdouble(), APFloat::rmNearestTiesToEven, &unused);
2300 return APF.convertToDouble();
2301}
2302
2303static bool getConstIntOrUndef(Value *Op, const APInt *&C) {
2304 if (auto *CI = dyn_cast<ConstantInt>(Op)) {
2305 C = &CI->getValue();
2306 return true;
2307 }
2308 if (isa<UndefValue>(Op)) {
2309 C = nullptr;
2310 return true;
2311 }
2312 return false;
2313}
2314
2315/// Checks if the given intrinsic call, which evaluates to constant, is allowed
2316/// to be folded.
2317///
2318/// \param CI Constrained intrinsic call.
2319/// \param St Exception flags raised during constant evaluation.
2320static bool mayFoldConstrained(ConstrainedFPIntrinsic *CI,
2321 APFloat::opStatus St) {
2322 std::optional<RoundingMode> ORM = CI->getRoundingMode();
2323 std::optional<fp::ExceptionBehavior> EB = CI->getExceptionBehavior();
2324
2325 // If the operation does not change exception status flags, it is safe
2326 // to fold.
2327 if (St == APFloat::opStatus::opOK)
2328 return true;
2329
2330 // If evaluation raised FP exception, the result can depend on rounding
2331 // mode. If the latter is unknown, folding is not possible.
2332 if (ORM == RoundingMode::Dynamic)
2333 return false;
2334
2335 // If FP exceptions are ignored, fold the call, even if such exception is
2336 // raised.
2337 if (EB && *EB != fp::ExceptionBehavior::ebStrict)
2338 return true;
2339
2340 // Leave the calculation for runtime so that exception flags are set
2341 // correctly in hardware.
2342 return false;
2343}
2344
2345/// Returns the rounding mode that should be used for constant evaluation.
2346static RoundingMode
2347getEvaluationRoundingMode(const ConstrainedFPIntrinsic *CI) {
2348 std::optional<RoundingMode> ORM = CI->getRoundingMode();
2349 if (!ORM || *ORM == RoundingMode::Dynamic)
2350 // Even if the rounding mode is unknown, try evaluating the operation.
2351 // If it does not raise inexact exception, rounding was not applied,
2352 // so the result is exact and does not depend on rounding mode. Whether
2353 // other FP exceptions are raised does not depend on the rounding mode either.
2354 return RoundingMode::NearestTiesToEven;
2355 return *ORM;
2356}
2357
2358/// Try to constant fold llvm.canonicalize for the given caller and value.
2359static Constant *constantFoldCanonicalize(const Type *Ty, const CallBase *CI,
2360 const APFloat &Src) {
2361 // Zero, positive and negative, is always OK to fold.
2362 if (Src.isZero()) {
2363 // Get a fresh 0, since ppc_fp128 does have non-canonical zeros.
2364 return ConstantFP::get(
2365 CI->getContext(),
2366 APFloat::getZero(Src.getSemantics(), Src.isNegative()));
2367 }
2368
2369 if (!Ty->isIEEELikeFPTy())
2370 return nullptr;
2371
2372 // Zero is always canonical and the sign must be preserved.
2373 //
2374 // Denorms and nans may have special encodings, but it should be OK to fold a
2375 // totally average number.
2376 if (Src.isNormal() || Src.isInfinity())
2377 return ConstantFP::get(CI->getContext(), Src);
2378
2379 if (Src.isDenormal() && CI->getParent() && CI->getFunction()) {
2380 DenormalMode DenormMode =
2381 CI->getFunction()->getDenormalMode(Src.getSemantics());
2382
2383 if (DenormMode == DenormalMode::getIEEE())
2384 return ConstantFP::get(CI->getContext(), Src);
2385
2386 if (DenormMode.Input == DenormalMode::Dynamic)
2387 return nullptr;
2388
2389 // If we know if either input or output is flushed, we can fold.
2390 if ((DenormMode.Input == DenormalMode::Dynamic &&
2391 DenormMode.Output == DenormalMode::IEEE) ||
2392 (DenormMode.Input == DenormalMode::IEEE &&
2393 DenormMode.Output == DenormalMode::Dynamic))
2394 return nullptr;
2395
2396 bool IsPositive =
2397 (!Src.isNegative() || DenormMode.Input == DenormalMode::PositiveZero ||
2398 (DenormMode.Output == DenormalMode::PositiveZero &&
2399 DenormMode.Input == DenormalMode::IEEE));
2400
2401 return ConstantFP::get(CI->getContext(),
2402 APFloat::getZero(Src.getSemantics(), !IsPositive));
2403 }
2404
2405 return nullptr;
2406}
2407
2408static Constant *ConstantFoldScalarCall1(StringRef Name,
2409 Intrinsic::ID IntrinsicID,
2410 Type *Ty,
2411 ArrayRef<Constant *> Operands,
2412 const TargetLibraryInfo *TLI,
2413 const CallBase *Call) {
2414 assert(Operands.size() == 1 && "Wrong number of operands.");
2415
2416 if (IntrinsicID == Intrinsic::is_constant) {
2417 // We know we have a "Constant" argument. But we want to only
2418 // return true for manifest constants, not those that depend on
2419 // constants with unknowable values, e.g. GlobalValue or BlockAddress.
2420 if (Operands[0]->isManifestConstant())
2421 return ConstantInt::getTrue(Ty->getContext());
2422 return nullptr;
2423 }
2424
2425 if (isa<UndefValue>(Operands[0])) {
2426 // cosine(arg) is between -1 and 1. cosine(invalid arg) is NaN.
2427 // ctpop() is between 0 and bitwidth, pick 0 for undef.
2428 // fptoui.sat and fptosi.sat can always fold to zero (for a zero input).
2429 if (IntrinsicID == Intrinsic::cos ||
2430 IntrinsicID == Intrinsic::ctpop ||
2431 IntrinsicID == Intrinsic::fptoui_sat ||
2432 IntrinsicID == Intrinsic::fptosi_sat ||
2433 IntrinsicID == Intrinsic::canonicalize)
2434 return Constant::getNullValue(Ty);
2435 if (IntrinsicID == Intrinsic::bswap ||
2436 IntrinsicID == Intrinsic::bitreverse ||
2437 IntrinsicID == Intrinsic::launder_invariant_group ||
2438 IntrinsicID == Intrinsic::strip_invariant_group)
2439 return Operands[0];
2440 }
2441
2442 if (isa<ConstantPointerNull>(Operands[0])) {
2443 // launder(null) == null == strip(null) iff in addrspace 0
2444 if (IntrinsicID == Intrinsic::launder_invariant_group ||
2445 IntrinsicID == Intrinsic::strip_invariant_group) {
2446 // If instruction is not yet put in a basic block (e.g. when cloning
2447 // a function during inlining), Call's caller may not be available.
2448 // So check Call's BB first before querying Call->getCaller.
2449 const Function *Caller =
2450 Call->getParent() ? Call->getCaller() : nullptr;
2451 if (Caller &&
2452 !NullPointerIsDefined(
2453 Caller, Operands[0]->getType()->getPointerAddressSpace())) {
2454 return Operands[0];
2455 }
2456 return nullptr;
2457 }
2458 }
2459
2460 if (auto *Op = dyn_cast<ConstantFP>(Operands[0])) {
2461 if (IntrinsicID == Intrinsic::convert_to_fp16) {
2462 APFloat Val(Op->getValueAPF());
2463
2464 bool lost = false;
2465 Val.convert(APFloat::IEEEhalf(), APFloat::rmNearestTiesToEven, &lost);
2466
2467 return ConstantInt::get(Ty->getContext(), Val.bitcastToAPInt());
2468 }
2469
2470 APFloat U = Op->getValueAPF();
2471
2472 if (IntrinsicID == Intrinsic::wasm_trunc_signed ||
2473 IntrinsicID == Intrinsic::wasm_trunc_unsigned) {
2474 bool Signed = IntrinsicID == Intrinsic::wasm_trunc_signed;
2475
2476 if (U.isNaN())
2477 return nullptr;
2478
2479 unsigned Width = Ty->getIntegerBitWidth();
2480 APSInt Int(Width, !Signed);
2481 bool IsExact = false;
2482 APFloat::opStatus Status =
2483 U.convertToInteger(Int, APFloat::rmTowardZero, &IsExact);
2484
2485 if (Status == APFloat::opOK || Status == APFloat::opInexact)
2486 return ConstantInt::get(Ty, Int);
2487
2488 return nullptr;
2489 }
2490
2491 if (IntrinsicID == Intrinsic::fptoui_sat ||
2492 IntrinsicID == Intrinsic::fptosi_sat) {
2493 // convertToInteger() already has the desired saturation semantics.
2494 APSInt Int(Ty->getIntegerBitWidth(),
2495 IntrinsicID == Intrinsic::fptoui_sat);
2496 bool IsExact;
2497 U.convertToInteger(Int, APFloat::rmTowardZero, &IsExact);
2498 return ConstantInt::get(Ty, Int);
2499 }
2500
2501 if (IntrinsicID == Intrinsic::canonicalize)
2502 return constantFoldCanonicalize(Ty, Call, U);
2503
2504#if defined(HAS_IEE754_FLOAT128) && defined(HAS_LOGF128)
2505 if (Ty->isFP128Ty()) {
2506 if (IntrinsicID == Intrinsic::log) {
2507 float128 Result = logf128(Op->getValueAPF().convertToQuad());
2508 return GetConstantFoldFPValue128(Result, Ty);
2509 }
2510
2511 LibFunc Fp128Func = NotLibFunc;
2512 if (TLI && TLI->getLibFunc(Name, Fp128Func) && TLI->has(Fp128Func) &&
2513 Fp128Func == LibFunc_logl)
2514 return ConstantFoldFP128(logf128, Op->getValueAPF(), Ty);
2515 }
2516#endif
2517
2518 if (!Ty->isHalfTy() && !Ty->isFloatTy() && !Ty->isDoubleTy() &&
2519 !Ty->isIntegerTy())
2520 return nullptr;
2521
2522 // Use internal versions of these intrinsics.
2523
2524 if (IntrinsicID == Intrinsic::nearbyint || IntrinsicID == Intrinsic::rint ||
2525 IntrinsicID == Intrinsic::roundeven) {
2526 U.roundToIntegral(APFloat::rmNearestTiesToEven);
2527 return ConstantFP::get(Ty, U);
2528 }
2529
2530 if (IntrinsicID == Intrinsic::round) {
2531 U.roundToIntegral(APFloat::rmNearestTiesToAway);
2532 return ConstantFP::get(Ty, U);
2533 }
2534
2535 if (IntrinsicID == Intrinsic::roundeven) {
2536 U.roundToIntegral(APFloat::rmNearestTiesToEven);
2537 return ConstantFP::get(Ty, U);
2538 }
2539
2540 if (IntrinsicID == Intrinsic::ceil) {
2541 U.roundToIntegral(APFloat::rmTowardPositive);
2542 return ConstantFP::get(Ty, U);
2543 }
2544
2545 if (IntrinsicID == Intrinsic::floor) {
2546 U.roundToIntegral(APFloat::rmTowardNegative);
2547 return ConstantFP::get(Ty, U);
2548 }
2549
2550 if (IntrinsicID == Intrinsic::trunc) {
2551 U.roundToIntegral(APFloat::rmTowardZero);
2552 return ConstantFP::get(Ty, U);
2553 }
2554
2555 if (IntrinsicID == Intrinsic::fabs) {
2556 U.clearSign();
2557 return ConstantFP::get(Ty, U);
2558 }
2559
2560 if (IntrinsicID == Intrinsic::amdgcn_fract) {
2561 // The v_fract instruction behaves like the OpenCL spec, which defines
2562 // fract(x) as fmin(x - floor(x), 0x1.fffffep-1f): "The min() operator is
2563 // there to prevent fract(-small) from returning 1.0. It returns the
2564 // largest positive floating-point number less than 1.0."
2565 APFloat FloorU(U);
2566 FloorU.roundToIntegral(APFloat::rmTowardNegative);
2567 APFloat FractU(U - FloorU);
2568 APFloat AlmostOne(U.getSemantics(), 1);
2569 AlmostOne.next(/*nextDown*/ true);
2570 return ConstantFP::get(Ty, minimum(FractU, AlmostOne));
2571 }
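// Illustrative note (not part of the upstream source): for a tiny negative
// float such as x = -2^-25, x - floor(x) = 1 - 2^-25, which rounds to 1.0f in
// single precision; taking the minimum with nextDown(1.0) = 0x1.fffffep-1f is
// what keeps the folded result strictly below 1.0, as the comment above
// describes.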
2572
2573 // Rounding operations (floor, trunc, ceil, round and nearbyint) do not
2574 // raise FP exceptions, unless the argument is signaling NaN.
2575
2576 std::optional<APFloat::roundingMode> RM;
2577 switch (IntrinsicID) {
2578 default:
2579 break;
2580 case Intrinsic::experimental_constrained_nearbyint:
2581 case Intrinsic::experimental_constrained_rint: {
2582 auto CI = cast<ConstrainedFPIntrinsic>(Call);
2583 RM = CI->getRoundingMode();
2584 if (!RM || *RM == RoundingMode::Dynamic)
2585 return nullptr;
2586 break;
2587 }
2588 case Intrinsic::experimental_constrained_round:
2589 RM = APFloat::rmNearestTiesToAway;
2590 break;
2591 case Intrinsic::experimental_constrained_ceil:
2592 RM = APFloat::rmTowardPositive;
2593 break;
2594 case Intrinsic::experimental_constrained_floor:
2595 RM = APFloat::rmTowardNegative;
2596 break;
2597 case Intrinsic::experimental_constrained_trunc:
2598 RM = APFloat::rmTowardZero;
2599 break;
2600 }
2601 if (RM) {
2602 auto CI = cast<ConstrainedFPIntrinsic>(Call);
2603 if (U.isFinite()) {
2604 APFloat::opStatus St = U.roundToIntegral(*RM);
2605 if (IntrinsicID == Intrinsic::experimental_constrained_rint &&
2606 St == APFloat::opInexact) {
2607 std::optional<fp::ExceptionBehavior> EB = CI->getExceptionBehavior();
2608 if (EB == fp::ebStrict)
2609 return nullptr;
2610 }
2611 } else if (U.isSignaling()) {
2612 std::optional<fp::ExceptionBehavior> EB = CI->getExceptionBehavior();
2613 if (EB && *EB != fp::ebIgnore)
2614 return nullptr;
2615 U = APFloat::getQNaN(U.getSemantics());
2616 }
2617 return ConstantFP::get(Ty, U);
2618 }
2619
2620 // NVVM float/double to signed/unsigned int32/int64 conversions:
2621 switch (IntrinsicID) {
2622 // f2i
2623 case Intrinsic::nvvm_f2i_rm:
2624 case Intrinsic::nvvm_f2i_rn:
2625 case Intrinsic::nvvm_f2i_rp:
2626 case Intrinsic::nvvm_f2i_rz:
2627 case Intrinsic::nvvm_f2i_rm_ftz:
2628 case Intrinsic::nvvm_f2i_rn_ftz:
2629 case Intrinsic::nvvm_f2i_rp_ftz:
2630 case Intrinsic::nvvm_f2i_rz_ftz:
2631 // f2ui
2632 case Intrinsic::nvvm_f2ui_rm:
2633 case Intrinsic::nvvm_f2ui_rn:
2634 case Intrinsic::nvvm_f2ui_rp:
2635 case Intrinsic::nvvm_f2ui_rz:
2636 case Intrinsic::nvvm_f2ui_rm_ftz:
2637 case Intrinsic::nvvm_f2ui_rn_ftz:
2638 case Intrinsic::nvvm_f2ui_rp_ftz:
2639 case Intrinsic::nvvm_f2ui_rz_ftz:
2640 // d2i
2641 case Intrinsic::nvvm_d2i_rm:
2642 case Intrinsic::nvvm_d2i_rn:
2643 case Intrinsic::nvvm_d2i_rp:
2644 case Intrinsic::nvvm_d2i_rz:
2645 // d2ui
2646 case Intrinsic::nvvm_d2ui_rm:
2647 case Intrinsic::nvvm_d2ui_rn:
2648 case Intrinsic::nvvm_d2ui_rp:
2649 case Intrinsic::nvvm_d2ui_rz:
2650 // f2ll
2651 case Intrinsic::nvvm_f2ll_rm:
2652 case Intrinsic::nvvm_f2ll_rn:
2653 case Intrinsic::nvvm_f2ll_rp:
2654 case Intrinsic::nvvm_f2ll_rz:
2655 case Intrinsic::nvvm_f2ll_rm_ftz:
2656 case Intrinsic::nvvm_f2ll_rn_ftz:
2657 case Intrinsic::nvvm_f2ll_rp_ftz:
2658 case Intrinsic::nvvm_f2ll_rz_ftz:
2659 // f2ull
2660 case Intrinsic::nvvm_f2ull_rm:
2661 case Intrinsic::nvvm_f2ull_rn:
2662 case Intrinsic::nvvm_f2ull_rp:
2663 case Intrinsic::nvvm_f2ull_rz:
2664 case Intrinsic::nvvm_f2ull_rm_ftz:
2665 case Intrinsic::nvvm_f2ull_rn_ftz:
2666 case Intrinsic::nvvm_f2ull_rp_ftz:
2667 case Intrinsic::nvvm_f2ull_rz_ftz:
2668 // d2ll
2669 case Intrinsic::nvvm_d2ll_rm:
2670 case Intrinsic::nvvm_d2ll_rn:
2671 case Intrinsic::nvvm_d2ll_rp:
2672 case Intrinsic::nvvm_d2ll_rz:
2673 // d2ull
2674 case Intrinsic::nvvm_d2ull_rm:
2675 case Intrinsic::nvvm_d2ull_rn:
2676 case Intrinsic::nvvm_d2ull_rp:
2677 case Intrinsic::nvvm_d2ull_rz: {
2678 // NaN inputs need special handling in float-to-integer conversion.
2679 if (U.isNaN()) {
2680 // In float-to-integer conversion, NaN inputs are converted to 0
2681 // when the source and destination bitwidths are both less than 64.
2682 if (nvvm::FPToIntegerIntrinsicNaNZero(IntrinsicID))
2683 return ConstantInt::get(Ty, 0);
2684
2685 // Otherwise, the most significant bit is set.
2686 unsigned BitWidth = Ty->getIntegerBitWidth();
2687 uint64_t Val = 1ULL << (BitWidth - 1);
2688 return ConstantInt::get(Ty, APInt(BitWidth, Val, /*IsSigned=*/false));
2689 }
2690
2691 APFloat::roundingMode RMode =
2693 bool IsFTZ = nvvm::FPToIntegerIntrinsicShouldFTZ(IntrinsicID);
2694 bool IsSigned = nvvm::FPToIntegerIntrinsicResultIsSigned(IntrinsicID);
2695
2696 APSInt ResInt(Ty->getIntegerBitWidth(), !IsSigned);
2697 auto FloatToRound = IsFTZ ? FTZPreserveSign(U) : U;
2698
2699 // Return max/min value for integers if the result is +/-inf or
2700 // is too large to fit in the result's integer bitwidth.
2701 bool IsExact = false;
2702 FloatToRound.convertToInteger(ResInt, RMode, &IsExact);
2703 return ConstantInt::get(Ty, ResInt);
2704 }
2705 }
2706
2707 /// We only fold functions with finite arguments. Folding NaN and inf is
2708 /// likely to be aborted with an exception anyway, and some host libms
2709 /// have known errors raising exceptions.
2710 if (!U.isFinite())
2711 return nullptr;
2712
2713 /// Currently APFloat versions of these functions do not exist, so we use
2714 /// the host native double versions. Float versions are not called
2715 /// directly but for all these it is true (float)(f((double)arg)) ==
2716 /// f(arg). Long double not supported yet.
2717 const APFloat &APF = Op->getValueAPF();
2718
2719 switch (IntrinsicID) {
2720 default: break;
2721 case Intrinsic::log:
2722 if (U.isZero())
2723 return ConstantFP::getInfinity(Ty, true);
2724 if (U.isNegative())
2725 return ConstantFP::getNaN(Ty);
2726 if (U.isExactlyValue(1.0))
2727 return ConstantFP::getZero(Ty);
2728 return ConstantFoldFP(log, APF, Ty);
2729 case Intrinsic::log2:
2730 if (U.isZero())
2731 return ConstantFP::getInfinity(Ty, true);
2732 if (U.isNegative())
2733 return ConstantFP::getNaN(Ty);
2734 if (U.isExactlyValue(1.0))
2735 return ConstantFP::getZero(Ty);
2736 // TODO: What about hosts that lack a C99 library?
2737 return ConstantFoldFP(log2, APF, Ty);
2738 case Intrinsic::log10:
2739 if (U.isZero())
2740 return ConstantFP::getInfinity(Ty, true);
2741 if (U.isNegative())
2742 return ConstantFP::getNaN(Ty);
2743 if (U.isExactlyValue(1.0))
2744 return ConstantFP::getZero(Ty);
2745 // TODO: What about hosts that lack a C99 library?
2746 return ConstantFoldFP(log10, APF, Ty);
2747 case Intrinsic::exp:
2748 return ConstantFoldFP(exp, APF, Ty);
2749 case Intrinsic::exp2:
2750 // Fold exp2(x) as pow(2, x), in case the host lacks a C99 library.
2751 return ConstantFoldBinaryFP(pow, APFloat(2.0), APF, Ty);
2752 case Intrinsic::exp10:
2753 // Fold exp10(x) as pow(10, x), in case the host lacks a C99 library.
2754 return ConstantFoldBinaryFP(pow, APFloat(10.0), APF, Ty);
2755 case Intrinsic::sin:
2756 return ConstantFoldFP(sin, APF, Ty);
2757 case Intrinsic::cos:
2758 return ConstantFoldFP(cos, APF, Ty);
2759 case Intrinsic::sinh:
2760 return ConstantFoldFP(sinh, APF, Ty);
2761 case Intrinsic::cosh:
2762 return ConstantFoldFP(cosh, APF, Ty);
2763 case Intrinsic::atan:
2764 // Implement optional behavior from C's Annex F for +/-0.0.
2765 if (U.isZero())
2766 return ConstantFP::get(Ty, U);
2767 return ConstantFoldFP(atan, APF, Ty);
2768 case Intrinsic::sqrt:
2769 return ConstantFoldFP(sqrt, APF, Ty);
2770
2771 // NVVM Intrinsics:
2772 case Intrinsic::nvvm_ceil_ftz_f:
2773 case Intrinsic::nvvm_ceil_f:
2774 case Intrinsic::nvvm_ceil_d:
2775 return ConstantFoldFP(
2776 ceil, APF, Ty,
2778 nvvm::UnaryMathIntrinsicShouldFTZ(IntrinsicID)));
2779
2780 case Intrinsic::nvvm_fabs_ftz:
2781 case Intrinsic::nvvm_fabs:
2782 return ConstantFoldFP(
2783 fabs, APF, Ty,
2785 nvvm::UnaryMathIntrinsicShouldFTZ(IntrinsicID)));
2786
2787 case Intrinsic::nvvm_floor_ftz_f:
2788 case Intrinsic::nvvm_floor_f:
2789 case Intrinsic::nvvm_floor_d:
2790 return ConstantFoldFP(
2791 floor, APF, Ty,
2793 nvvm::UnaryMathIntrinsicShouldFTZ(IntrinsicID)));
2794
2795 case Intrinsic::nvvm_rcp_rm_ftz_f:
2796 case Intrinsic::nvvm_rcp_rn_ftz_f:
2797 case Intrinsic::nvvm_rcp_rp_ftz_f:
2798 case Intrinsic::nvvm_rcp_rz_ftz_f:
2799 case Intrinsic::nvvm_rcp_rm_d:
2800 case Intrinsic::nvvm_rcp_rm_f:
2801 case Intrinsic::nvvm_rcp_rn_d:
2802 case Intrinsic::nvvm_rcp_rn_f:
2803 case Intrinsic::nvvm_rcp_rp_d:
2804 case Intrinsic::nvvm_rcp_rp_f:
2805 case Intrinsic::nvvm_rcp_rz_d:
2806 case Intrinsic::nvvm_rcp_rz_f: {
2807 APFloat::roundingMode RoundMode = nvvm::GetRCPRoundingMode(IntrinsicID);
2808 bool IsFTZ = nvvm::RCPShouldFTZ(IntrinsicID);
2809
2810 auto Denominator = IsFTZ ? FTZPreserveSign(APF) : APF;
2811 APFloat Res = APFloat::getOne(APF.getSemantics());
2812 APFloat::opStatus Status = Res.divide(Denominator, RoundMode);
2813
2814 if (Status == APFloat::opOK || Status == APFloat::opInexact) {
2815 if (IsFTZ)
2816 Res = FTZPreserveSign(Res);
2817 return ConstantFP::get(Ty, Res);
2818 }
2819 return nullptr;
2820 }
2821
2822 case Intrinsic::nvvm_round_ftz_f:
2823 case Intrinsic::nvvm_round_f:
2824 case Intrinsic::nvvm_round_d: {
2825 // nvvm_round is lowered to PTX cvt.rni, which will round to nearest
2826 // integer, choosing even integer if source is equidistant between two
2827 // integers, so the semantics are closer to "rint" than to "round".
2828 bool IsFTZ = nvvm::UnaryMathIntrinsicShouldFTZ(IntrinsicID);
2829 auto V = IsFTZ ? FTZPreserveSign(APF) : APF;
2830 V.roundToIntegral(APFloat::rmNearestTiesToEven);
2831 return ConstantFP::get(Ty, V);
2832 }
2833
2834 case Intrinsic::nvvm_saturate_ftz_f:
2835 case Intrinsic::nvvm_saturate_d:
2836 case Intrinsic::nvvm_saturate_f: {
2837 bool IsFTZ = nvvm::UnaryMathIntrinsicShouldFTZ(IntrinsicID);
2838 auto V = IsFTZ ? FTZPreserveSign(APF) : APF;
2839 if (V.isNegative() || V.isZero() || V.isNaN())
2840 return ConstantFP::getZero(Ty);
2841 APFloat One(V.getSemantics(), "1.0");
2842 if (V > One)
2843 return ConstantFP::get(Ty, One);
2844 return ConstantFP::get(Ty, APF);
2845 }
2846
2847 case Intrinsic::nvvm_sqrt_rn_ftz_f:
2848 case Intrinsic::nvvm_sqrt_f:
2849 case Intrinsic::nvvm_sqrt_rn_d:
2850 case Intrinsic::nvvm_sqrt_rn_f:
2851 if (APF.isNegative())
2852 return nullptr;
2853 return ConstantFoldFP(
2854 sqrt, APF, Ty,
2856 nvvm::UnaryMathIntrinsicShouldFTZ(IntrinsicID)));
2857
2858 // AMDGCN Intrinsics:
2859 case Intrinsic::amdgcn_cos:
2860 case Intrinsic::amdgcn_sin: {
2861 double V = getValueAsDouble(Op);
2862 if (V < -256.0 || V > 256.0)
2863 // The gfx8 and gfx9 architectures handle arguments outside the range
2864 // [-256, 256] differently. This should be a rare case so bail out
2865 // rather than trying to handle the difference.
2866 return nullptr;
2867 bool IsCos = IntrinsicID == Intrinsic::amdgcn_cos;
2868 double V4 = V * 4.0;
2869 if (V4 == floor(V4)) {
2870 // Force exact results for quarter-integer inputs.
2871 const double SinVals[4] = { 0.0, 1.0, 0.0, -1.0 };
2872 V = SinVals[((int)V4 + (IsCos ? 1 : 0)) & 3];
2873 } else {
2874 if (IsCos)
2875 V = cos(V * 2.0 * numbers::pi);
2876 else
2877 V = sin(V * 2.0 * numbers::pi);
2878 }
2879 return GetConstantFoldFPValue(V, Ty);
2880 }
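// Illustrative note (not part of the upstream source): the argument is in
// units of full turns, so llvm.amdgcn.cos(0.25) means cos(pi/2); the
// quarter-integer table above makes it fold to exactly 0.0 rather than the
// slightly-off value cos(0.25 * 2 * pi) would give in double arithmetic.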
2881 }
2882
2883 if (!TLI)
2884 return nullptr;
2885
2886 LibFunc Func = NotLibFunc;
2887 if (!TLI->getLibFunc(Name, Func))
2888 return nullptr;
2889
2890 switch (Func) {
2891 default:
2892 break;
2893 case LibFunc_acos:
2894 case LibFunc_acosf:
2895 case LibFunc_acos_finite:
2896 case LibFunc_acosf_finite:
2897 if (TLI->has(Func))
2898 return ConstantFoldFP(acos, APF, Ty);
2899 break;
2900 case LibFunc_asin:
2901 case LibFunc_asinf:
2902 case LibFunc_asin_finite:
2903 case LibFunc_asinf_finite:
2904 if (TLI->has(Func))
2905 return ConstantFoldFP(asin, APF, Ty);
2906 break;
2907 case LibFunc_atan:
2908 case LibFunc_atanf:
2909 // Implement optional behavior from C's Annex F for +/-0.0.
2910 if (U.isZero())
2911 return ConstantFP::get(Ty, U);
2912 if (TLI->has(Func))
2913 return ConstantFoldFP(atan, APF, Ty);
2914 break;
2915 case LibFunc_ceil:
2916 case LibFunc_ceilf:
2917 if (TLI->has(Func)) {
2918 U.roundToIntegral(APFloat::rmTowardPositive);
2919 return ConstantFP::get(Ty, U);
2920 }
2921 break;
2922 case LibFunc_cos:
2923 case LibFunc_cosf:
2924 if (TLI->has(Func))
2925 return ConstantFoldFP(cos, APF, Ty);
2926 break;
2927 case LibFunc_cosh:
2928 case LibFunc_coshf:
2929 case LibFunc_cosh_finite:
2930 case LibFunc_coshf_finite:
2931 if (TLI->has(Func))
2932 return ConstantFoldFP(cosh, APF, Ty);
2933 break;
2934 case LibFunc_exp:
2935 case LibFunc_expf:
2936 case LibFunc_exp_finite:
2937 case LibFunc_expf_finite:
2938 if (TLI->has(Func))
2939 return ConstantFoldFP(exp, APF, Ty);
2940 break;
2941 case LibFunc_exp2:
2942 case LibFunc_exp2f:
2943 case LibFunc_exp2_finite:
2944 case LibFunc_exp2f_finite:
2945 if (TLI->has(Func))
2946 // Fold exp2(x) as pow(2, x), in case the host lacks a C99 library.
2947 return ConstantFoldBinaryFP(pow, APFloat(2.0), APF, Ty);
2948 break;
2949 case LibFunc_fabs:
2950 case LibFunc_fabsf:
2951 if (TLI->has(Func)) {
2952 U.clearSign();
2953 return ConstantFP::get(Ty, U);
2954 }
2955 break;
2956 case LibFunc_floor:
2957 case LibFunc_floorf:
2958 if (TLI->has(Func)) {
2959 U.roundToIntegral(APFloat::rmTowardNegative);
2960 return ConstantFP::get(Ty, U);
2961 }
2962 break;
2963 case LibFunc_log:
2964 case LibFunc_logf:
2965 case LibFunc_log_finite:
2966 case LibFunc_logf_finite:
2967 if (!APF.isNegative() && !APF.isZero() && TLI->has(Func))
2968 return ConstantFoldFP(log, APF, Ty);
2969 break;
2970 case LibFunc_log2:
2971 case LibFunc_log2f:
2972 case LibFunc_log2_finite:
2973 case LibFunc_log2f_finite:
2974 if (!APF.isNegative() && !APF.isZero() && TLI->has(Func))
2975 // TODO: What about hosts that lack a C99 library?
2976 return ConstantFoldFP(log2, APF, Ty);
2977 break;
2978 case LibFunc_log10:
2979 case LibFunc_log10f:
2980 case LibFunc_log10_finite:
2981 case LibFunc_log10f_finite:
2982 if (!APF.isNegative() && !APF.isZero() && TLI->has(Func))
2983 // TODO: What about hosts that lack a C99 library?
2984 return ConstantFoldFP(log10, APF, Ty);
2985 break;
2986 case LibFunc_ilogb:
2987 case LibFunc_ilogbf:
2988 if (!APF.isZero() && TLI->has(Func))
2989 return ConstantInt::get(Ty, ilogb(APF), true);
2990 break;
2991 case LibFunc_logb:
2992 case LibFunc_logbf:
2993 if (!APF.isZero() && TLI->has(Func))
2994 return ConstantFoldFP(logb, APF, Ty);
2995 break;
2996 case LibFunc_log1p:
2997 case LibFunc_log1pf:
2998 // Implement optional behavior from C's Annex F for +/-0.0.
2999 if (U.isZero())
3000 return ConstantFP::get(Ty, U);
3001 if (APF > APFloat::getOne(APF.getSemantics(), true) && TLI->has(Func))
3002 return ConstantFoldFP(log1p, APF, Ty);
3003 break;
3004 case LibFunc_logl:
3005 return nullptr;
3006 case LibFunc_erf:
3007 case LibFunc_erff:
3008 if (TLI->has(Func))
3009 return ConstantFoldFP(erf, APF, Ty);
3010 break;
3011 case LibFunc_nearbyint:
3012 case LibFunc_nearbyintf:
3013 case LibFunc_rint:
3014 case LibFunc_rintf:
3015 case LibFunc_roundeven:
3016 case LibFunc_roundevenf:
3017 if (TLI->has(Func)) {
3018 U.roundToIntegral(APFloat::rmNearestTiesToEven);
3019 return ConstantFP::get(Ty, U);
3020 }
3021 break;
3022 case LibFunc_round:
3023 case LibFunc_roundf:
3024 if (TLI->has(Func)) {
3025 U.roundToIntegral(APFloat::rmNearestTiesToAway);
3026 return ConstantFP::get(Ty, U);
3027 }
3028 break;
3029 case LibFunc_sin:
3030 case LibFunc_sinf:
3031 if (TLI->has(Func))
3032 return ConstantFoldFP(sin, APF, Ty);
3033 break;
3034 case LibFunc_sinh:
3035 case LibFunc_sinhf:
3036 case LibFunc_sinh_finite:
3037 case LibFunc_sinhf_finite:
3038 if (TLI->has(Func))
3039 return ConstantFoldFP(sinh, APF, Ty);
3040 break;
3041 case LibFunc_sqrt:
3042 case LibFunc_sqrtf:
3043 if (!APF.isNegative() && TLI->has(Func))
3044 return ConstantFoldFP(sqrt, APF, Ty);
3045 break;
3046 case LibFunc_tan:
3047 case LibFunc_tanf:
3048 if (TLI->has(Func))
3049 return ConstantFoldFP(tan, APF, Ty);
3050 break;
3051 case LibFunc_tanh:
3052 case LibFunc_tanhf:
3053 if (TLI->has(Func))
3054 return ConstantFoldFP(tanh, APF, Ty);
3055 break;
3056 case LibFunc_trunc:
3057 case LibFunc_truncf:
3058 if (TLI->has(Func)) {
3059 U.roundToIntegral(APFloat::rmTowardZero);
3060 return ConstantFP::get(Ty, U);
3061 }
3062 break;
3063 }
3064 return nullptr;
3065 }
3066
3067 if (auto *Op = dyn_cast<ConstantInt>(Operands[0])) {
3068 switch (IntrinsicID) {
3069 case Intrinsic::bswap:
3070 return ConstantInt::get(Ty->getContext(), Op->getValue().byteSwap());
3071 case Intrinsic::ctpop:
3072 return ConstantInt::get(Ty, Op->getValue().popcount());
3073 case Intrinsic::bitreverse:
3074 return ConstantInt::get(Ty->getContext(), Op->getValue().reverseBits());
3075 case Intrinsic::convert_from_fp16: {
3076 APFloat Val(APFloat::IEEEhalf(), Op->getValue());
3077
3078 bool lost = false;
3079 APFloat::opStatus status = Val.convert(
3080 Ty->getFltSemantics(), APFloat::rmNearestTiesToEven, &lost);
3081
3082 // Conversion is always precise.
3083 (void)status;
3084 assert(status != APFloat::opInexact && !lost &&
3085 "Precision lost during fp16 constfolding");
3086
3087 return ConstantFP::get(Ty, Val);
3088 }
3089
3090 case Intrinsic::amdgcn_s_wqm: {
3091 uint64_t Val = Op->getZExtValue();
3092 Val |= (Val & 0x5555555555555555ULL) << 1 |
3093 ((Val >> 1) & 0x5555555555555555ULL);
3094 Val |= (Val & 0x3333333333333333ULL) << 2 |
3095 ((Val >> 2) & 0x3333333333333333ULL);
3096 return ConstantInt::get(Ty, Val);
3097 }
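// Illustrative note (not part of the upstream source): s_wqm sets every bit
// of a 4-bit group if any bit in that group was set, e.g. an i32 input of
// 0x00020001 folds to 0x000F000F.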
3098
3099 case Intrinsic::amdgcn_s_quadmask: {
3100 uint64_t Val = Op->getZExtValue();
3101 uint64_t QuadMask = 0;
3102 for (unsigned I = 0; I < Op->getBitWidth() / 4; ++I, Val >>= 4) {
3103 if (!(Val & 0xF))
3104 continue;
3105
3106 QuadMask |= (1ULL << I);
3107 }
3108 return ConstantInt::get(Ty, QuadMask);
3109 }
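// Illustrative note (not part of the upstream source): s_quadmask produces
// one output bit per 4-bit group, e.g. an i32 input of 0x0000F0F1 has
// non-zero groups 0, 1 and 3, so the call folds to 0b1011 = 0xB.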
3110
3111 case Intrinsic::amdgcn_s_bitreplicate: {
3112 uint64_t Val = Op->getZExtValue();
3113 Val = (Val & 0x000000000000FFFFULL) | (Val & 0x00000000FFFF0000ULL) << 16;
3114 Val = (Val & 0x000000FF000000FFULL) | (Val & 0x0000FF000000FF00ULL) << 8;
3115 Val = (Val & 0x000F000F000F000FULL) | (Val & 0x00F000F000F000F0ULL) << 4;
3116 Val = (Val & 0x0303030303030303ULL) | (Val & 0x0C0C0C0C0C0C0C0CULL) << 2;
3117 Val = (Val & 0x1111111111111111ULL) | (Val & 0x2222222222222222ULL) << 1;
3118 Val = Val | Val << 1;
3119 return ConstantInt::get(Ty, Val);
3120 }
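// Illustrative note (not part of the upstream source): s_bitreplicate doubles
// each of the 32 input bits into a pair of adjacent output bits, so an input
// of 0x3 (bits 0 and 1) folds to 0xF, and 0x80000000 folds to
// 0xC000000000000000.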
3121 }
3122 }
3123
3124 if (Operands[0]->getType()->isVectorTy()) {
3125 auto *Op = cast<Constant>(Operands[0]);
3126 switch (IntrinsicID) {
3127 default: break;
3128 case Intrinsic::vector_reduce_add:
3129 case Intrinsic::vector_reduce_mul:
3130 case Intrinsic::vector_reduce_and:
3131 case Intrinsic::vector_reduce_or:
3132 case Intrinsic::vector_reduce_xor:
3133 case Intrinsic::vector_reduce_smin:
3134 case Intrinsic::vector_reduce_smax:
3135 case Intrinsic::vector_reduce_umin:
3136 case Intrinsic::vector_reduce_umax:
3137 if (Constant *C = constantFoldVectorReduce(IntrinsicID, Operands[0]))
3138 return C;
3139 break;
3140 case Intrinsic::x86_sse_cvtss2si:
3141 case Intrinsic::x86_sse_cvtss2si64:
3142 case Intrinsic::x86_sse2_cvtsd2si:
3143 case Intrinsic::x86_sse2_cvtsd2si64:
3144 if (ConstantFP *FPOp =
3145 dyn_cast_or_null<ConstantFP>(Op->getAggregateElement(0U)))
3146 return ConstantFoldSSEConvertToInt(FPOp->getValueAPF(),
3147 /*roundTowardZero=*/false, Ty,
3148 /*IsSigned*/true);
3149 break;
3150 case Intrinsic::x86_sse_cvttss2si:
3151 case Intrinsic::x86_sse_cvttss2si64:
3152 case Intrinsic::x86_sse2_cvttsd2si:
3153 case Intrinsic::x86_sse2_cvttsd2si64:
3154 if (ConstantFP *FPOp =
3155 dyn_cast_or_null<ConstantFP>(Op->getAggregateElement(0U)))
3156 return ConstantFoldSSEConvertToInt(FPOp->getValueAPF(),
3157 /*roundTowardZero=*/true, Ty,
3158 /*IsSigned*/true);
3159 break;
3160
3161 case Intrinsic::wasm_anytrue:
3162 return Op->isZeroValue() ? ConstantInt::get(Ty, 0)
3163 : ConstantInt::get(Ty, 1);
3164
3165 case Intrinsic::wasm_alltrue:
3166 // Check each element individually
3167 unsigned E = cast<FixedVectorType>(Op->getType())->getNumElements();
3168 for (unsigned I = 0; I != E; ++I) {
3169 Constant *Elt = Op->getAggregateElement(I);
3170 // Return false as soon as we find a non-true element.
3171 if (Elt && Elt->isZeroValue())
3172 return ConstantInt::get(Ty, 0);
3173 // Bail as soon as we find an element we cannot prove to be true.
3174 if (!Elt || !isa<ConstantInt>(Elt))
3175 return nullptr;
3176 }
3177
3178 return ConstantInt::get(Ty, 1);
3179 }
3180 }
3181
3182 return nullptr;
3183}
3184
3185 static Constant *evaluateCompare(const APFloat &Op1, const APFloat &Op2,
3186 const ConstrainedFPIntrinsic *Call) {
3187 APFloat::opStatus St = APFloat::opOK;
3188 auto *FCmp = cast<ConstrainedFPCmpIntrinsic>(Call);
3189 FCmpInst::Predicate Cond = FCmp->getPredicate();
3190 if (FCmp->isSignaling()) {
3191 if (Op1.isNaN() || Op2.isNaN())
3192 St = APFloat::opInvalidOp;
3193 } else {
3194 if (Op1.isSignaling() || Op2.isSignaling())
3195 St = APFloat::opInvalidOp;
3196 }
3197 bool Result = FCmpInst::compare(Op1, Op2, Cond);
3198 if (mayFoldConstrained(const_cast<ConstrainedFPCmpIntrinsic *>(FCmp), St))
3199 return ConstantInt::get(Call->getType()->getScalarType(), Result);
3200 return nullptr;
3201}
3202
3203static Constant *ConstantFoldLibCall2(StringRef Name, Type *Ty,
3204 ArrayRef<Constant *> Operands,
3205 const TargetLibraryInfo *TLI) {
3206 if (!TLI)
3207 return nullptr;
3208
3209 LibFunc Func = NotLibFunc;
3210 if (!TLI->getLibFunc(Name, Func))
3211 return nullptr;
3212
3213 const auto *Op1 = dyn_cast<ConstantFP>(Operands[0]);
3214 if (!Op1)
3215 return nullptr;
3216
3217 const auto *Op2 = dyn_cast<ConstantFP>(Operands[1]);
3218 if (!Op2)
3219 return nullptr;
3220
3221 const APFloat &Op1V = Op1->getValueAPF();
3222 const APFloat &Op2V = Op2->getValueAPF();
3223
3224 switch (Func) {
3225 default:
3226 break;
3227 case LibFunc_pow:
3228 case LibFunc_powf:
3229 case LibFunc_pow_finite:
3230 case LibFunc_powf_finite:
3231 if (TLI->has(Func))
3232 return ConstantFoldBinaryFP(pow, Op1V, Op2V, Ty);
3233 break;
3234 case LibFunc_fmod:
3235 case LibFunc_fmodf:
3236 if (TLI->has(Func)) {
3237 APFloat V = Op1->getValueAPF();
3238 if (APFloat::opStatus::opOK == V.mod(Op2->getValueAPF()))
3239 return ConstantFP::get(Ty, V);
3240 }
3241 break;
3242 case LibFunc_remainder:
3243 case LibFunc_remainderf:
3244 if (TLI->has(Func)) {
3245 APFloat V = Op1->getValueAPF();
3246 if (APFloat::opStatus::opOK == V.remainder(Op2->getValueAPF()))
3247 return ConstantFP::get(Ty, V);
3248 }
3249 break;
3250 case LibFunc_atan2:
3251 case LibFunc_atan2f:
3252 // atan2(+/-0.0, +/-0.0) is known to raise an exception on some libm
3253 // (Solaris), so we do not assume a known result for that.
3254 if (Op1V.isZero() && Op2V.isZero())
3255 return nullptr;
3256 [[fallthrough]];
3257 case LibFunc_atan2_finite:
3258 case LibFunc_atan2f_finite:
3259 if (TLI->has(Func))
3260 return ConstantFoldBinaryFP(atan2, Op1V, Op2V, Ty);
3261 break;
3262 }
3263
3264 return nullptr;
3265}
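// Illustrative note (not part of the upstream source): a call such as
//   double @pow(double 2.0, double 10.0)
// folds to 1.024e+03 here, while atan2(+0.0, -0.0) is deliberately left
// unfolded because, as noted above, some host libms raise an exception for
// that input.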
3266
3267static Constant *ConstantFoldIntrinsicCall2(Intrinsic::ID IntrinsicID, Type *Ty,
3268 ArrayRef<Constant *> Operands,
3269 const CallBase *Call) {
3270 assert(Operands.size() == 2 && "Wrong number of operands.");
3271
3272 if (Ty->isFloatingPointTy()) {
3273 // TODO: We should have undef handling for all of the FP intrinsics that
3274 // are attempted to be folded in this function.
3275 bool IsOp0Undef = isa<UndefValue>(Operands[0]);
3276 bool IsOp1Undef = isa<UndefValue>(Operands[1]);
3277 switch (IntrinsicID) {
3278 case Intrinsic::maxnum:
3279 case Intrinsic::minnum:
3280 case Intrinsic::maximum:
3281 case Intrinsic::minimum:
3282 case Intrinsic::maximumnum:
3283 case Intrinsic::minimumnum:
3284 case Intrinsic::nvvm_fmax_d:
3285 case Intrinsic::nvvm_fmin_d:
3286 // If one argument is undef, return the other argument.
3287 if (IsOp0Undef)
3288 return Operands[1];
3289 if (IsOp1Undef)
3290 return Operands[0];
3291 break;
3292
3293 case Intrinsic::nvvm_fmax_f:
3294 case Intrinsic::nvvm_fmax_ftz_f:
3295 case Intrinsic::nvvm_fmax_ftz_nan_f:
3296 case Intrinsic::nvvm_fmax_ftz_nan_xorsign_abs_f:
3297 case Intrinsic::nvvm_fmax_ftz_xorsign_abs_f:
3298 case Intrinsic::nvvm_fmax_nan_f:
3299 case Intrinsic::nvvm_fmax_nan_xorsign_abs_f:
3300 case Intrinsic::nvvm_fmax_xorsign_abs_f:
3301
3302 case Intrinsic::nvvm_fmin_f:
3303 case Intrinsic::nvvm_fmin_ftz_f:
3304 case Intrinsic::nvvm_fmin_ftz_nan_f:
3305 case Intrinsic::nvvm_fmin_ftz_nan_xorsign_abs_f:
3306 case Intrinsic::nvvm_fmin_ftz_xorsign_abs_f:
3307 case Intrinsic::nvvm_fmin_nan_f:
3308 case Intrinsic::nvvm_fmin_nan_xorsign_abs_f:
3309 case Intrinsic::nvvm_fmin_xorsign_abs_f:
3310 // If one arg is undef, the other arg can be returned only if it is
3311 // constant, as we may need to flush it to sign-preserving zero or
3312 // canonicalize the NaN.
3313 if (!IsOp0Undef && !IsOp1Undef)
3314 break;
3315 if (auto *Op = dyn_cast<ConstantFP>(Operands[IsOp0Undef ? 1 : 0])) {
3316 if (Op->isNaN()) {
3317 APInt NVCanonicalNaN(32, 0x7fffffff);
3318 return ConstantFP::get(
3319 Ty, APFloat(Ty->getFltSemantics(), NVCanonicalNaN));
3320 }
3321 if (nvvm::FMinFMaxShouldFTZ(IntrinsicID))
3322 return ConstantFP::get(Ty, FTZPreserveSign(Op->getValueAPF()));
3323 else
3324 return Op;
3325 }
3326 break;
3327 }
3328 }
3329
3330 if (const auto *Op1 = dyn_cast<ConstantFP>(Operands[0])) {
3331 const APFloat &Op1V = Op1->getValueAPF();
3332
3333 if (const auto *Op2 = dyn_cast<ConstantFP>(Operands[1])) {
3334 if (Op2->getType() != Op1->getType())
3335 return nullptr;
3336 const APFloat &Op2V = Op2->getValueAPF();
3337
3338 if (const auto *ConstrIntr =
3340 RoundingMode RM = getEvaluationRoundingMode(ConstrIntr);
3341 APFloat Res = Op1V;
3342 APFloat::opStatus St;
3343 switch (IntrinsicID) {
3344 default:
3345 return nullptr;
3346 case Intrinsic::experimental_constrained_fadd:
3347 St = Res.add(Op2V, RM);
3348 break;
3349 case Intrinsic::experimental_constrained_fsub:
3350 St = Res.subtract(Op2V, RM);
3351 break;
3352 case Intrinsic::experimental_constrained_fmul:
3353 St = Res.multiply(Op2V, RM);
3354 break;
3355 case Intrinsic::experimental_constrained_fdiv:
3356 St = Res.divide(Op2V, RM);
3357 break;
3358 case Intrinsic::experimental_constrained_frem:
3359 St = Res.mod(Op2V);
3360 break;
3361 case Intrinsic::experimental_constrained_fcmp:
3362 case Intrinsic::experimental_constrained_fcmps:
3363 return evaluateCompare(Op1V, Op2V, ConstrIntr);
3364 }
3365 if (mayFoldConstrained(const_cast<ConstrainedFPIntrinsic *>(ConstrIntr),
3366 St))
3367 return ConstantFP::get(Ty, Res);
3368 return nullptr;
3369 }
3370
3371 switch (IntrinsicID) {
3372 default:
3373 break;
3374 case Intrinsic::copysign:
3375 return ConstantFP::get(Ty, APFloat::copySign(Op1V, Op2V));
3376 case Intrinsic::minnum:
3377 if (Op1V.isSignaling() || Op2V.isSignaling())
3378 return nullptr;
3379 return ConstantFP::get(Ty, minnum(Op1V, Op2V));
3380 case Intrinsic::maxnum:
3381 if (Op1V.isSignaling() || Op2V.isSignaling())
3382 return nullptr;
3383 return ConstantFP::get(Ty, maxnum(Op1V, Op2V));
3384 case Intrinsic::minimum:
3385 return ConstantFP::get(Ty, minimum(Op1V, Op2V));
3386 case Intrinsic::maximum:
3387 return ConstantFP::get(Ty, maximum(Op1V, Op2V));
3388 case Intrinsic::minimumnum:
3389 return ConstantFP::get(Ty, minimumnum(Op1V, Op2V));
3390 case Intrinsic::maximumnum:
3391 return ConstantFP::get(Ty, maximumnum(Op1V, Op2V));
3392
3393 case Intrinsic::nvvm_fmax_d:
3394 case Intrinsic::nvvm_fmax_f:
3395 case Intrinsic::nvvm_fmax_ftz_f:
3396 case Intrinsic::nvvm_fmax_ftz_nan_f:
3397 case Intrinsic::nvvm_fmax_ftz_nan_xorsign_abs_f:
3398 case Intrinsic::nvvm_fmax_ftz_xorsign_abs_f:
3399 case Intrinsic::nvvm_fmax_nan_f:
3400 case Intrinsic::nvvm_fmax_nan_xorsign_abs_f:
3401 case Intrinsic::nvvm_fmax_xorsign_abs_f:
3402
3403 case Intrinsic::nvvm_fmin_d:
3404 case Intrinsic::nvvm_fmin_f:
3405 case Intrinsic::nvvm_fmin_ftz_f:
3406 case Intrinsic::nvvm_fmin_ftz_nan_f:
3407 case Intrinsic::nvvm_fmin_ftz_nan_xorsign_abs_f:
3408 case Intrinsic::nvvm_fmin_ftz_xorsign_abs_f:
3409 case Intrinsic::nvvm_fmin_nan_f:
3410 case Intrinsic::nvvm_fmin_nan_xorsign_abs_f:
3411 case Intrinsic::nvvm_fmin_xorsign_abs_f: {
3412
3413 bool ShouldCanonicalizeNaNs = !(IntrinsicID == Intrinsic::nvvm_fmax_d ||
3414 IntrinsicID == Intrinsic::nvvm_fmin_d);
3415 bool IsFTZ = nvvm::FMinFMaxShouldFTZ(IntrinsicID);
3416 bool IsNaNPropagating = nvvm::FMinFMaxPropagatesNaNs(IntrinsicID);
3417 bool IsXorSignAbs = nvvm::FMinFMaxIsXorSignAbs(IntrinsicID);
3418
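// For the xorsign_abs variants the result is the min/max of |a| and |b|,
// with its sign set to sign(a) ^ sign(b).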
3419 APFloat A = IsFTZ ? FTZPreserveSign(Op1V) : Op1V;
3420 APFloat B = IsFTZ ? FTZPreserveSign(Op2V) : Op2V;
3421
3422 bool XorSign = false;
3423 if (IsXorSignAbs) {
3424 XorSign = A.isNegative() ^ B.isNegative();
3425 A = abs(A);
3426 B = abs(B);
3427 }
3428
3429 bool IsFMax = false;
3430 switch (IntrinsicID) {
3431 case Intrinsic::nvvm_fmax_d:
3432 case Intrinsic::nvvm_fmax_f:
3433 case Intrinsic::nvvm_fmax_ftz_f:
3434 case Intrinsic::nvvm_fmax_ftz_nan_f:
3435 case Intrinsic::nvvm_fmax_ftz_nan_xorsign_abs_f:
3436 case Intrinsic::nvvm_fmax_ftz_xorsign_abs_f:
3437 case Intrinsic::nvvm_fmax_nan_f:
3438 case Intrinsic::nvvm_fmax_nan_xorsign_abs_f:
3439 case Intrinsic::nvvm_fmax_xorsign_abs_f:
3440 IsFMax = true;
3441 break;
3442 }
3443 APFloat Res = IsFMax ? maximum(A, B) : minimum(A, B);
3444
3445 if (ShouldCanonicalizeNaNs) {
3446 APFloat NVCanonicalNaN(Res.getSemantics(), APInt(32, 0x7fffffff));
3447 if (A.isNaN() && B.isNaN())
3448 return ConstantFP::get(Ty, NVCanonicalNaN);
3449 else if (IsNaNPropagating && (A.isNaN() || B.isNaN()))
3450 return ConstantFP::get(Ty, NVCanonicalNaN);
3451 }
3452
3453 if (A.isNaN() && B.isNaN())
3454 return Operands[1];
3455 else if (A.isNaN())
3456 Res = B;
3457 else if (B.isNaN())
3458 Res = A;
3459
3460 if (IsXorSignAbs && XorSign != Res.isNegative())
3461 Res.changeSign();
3462
3463 return ConstantFP::get(Ty, Res);
3464 }
3465
3466 case Intrinsic::nvvm_add_rm_f:
3467 case Intrinsic::nvvm_add_rn_f:
3468 case Intrinsic::nvvm_add_rp_f:
3469 case Intrinsic::nvvm_add_rz_f:
3470 case Intrinsic::nvvm_add_rm_d:
3471 case Intrinsic::nvvm_add_rn_d:
3472 case Intrinsic::nvvm_add_rp_d:
3473 case Intrinsic::nvvm_add_rz_d:
3474 case Intrinsic::nvvm_add_rm_ftz_f:
3475 case Intrinsic::nvvm_add_rn_ftz_f:
3476 case Intrinsic::nvvm_add_rp_ftz_f:
3477 case Intrinsic::nvvm_add_rz_ftz_f: {
3478
3479 bool IsFTZ = nvvm::FAddShouldFTZ(IntrinsicID);
3480 APFloat A = IsFTZ ? FTZPreserveSign(Op1V) : Op1V;
3481 APFloat B = IsFTZ ? FTZPreserveSign(Op2V) : Op2V;
3482
3483 APFloat::roundingMode RoundMode =
3484 nvvm::GetFAddRoundingMode(IntrinsicID);
3485
3486 APFloat Res = A;
3487 APFloat::opStatus Status = Res.add(B, RoundMode);
3488
3489 if (!Res.isNaN() &&
3490 (Status == APFloat::opOK || Status == APFloat::opInexact)) {
3491 Res = IsFTZ ? FTZPreserveSign(Res) : Res;
3492 return ConstantFP::get(Ty, Res);
3493 }
3494 return nullptr;
3495 }
3496
3497 case Intrinsic::nvvm_mul_rm_f:
3498 case Intrinsic::nvvm_mul_rn_f:
3499 case Intrinsic::nvvm_mul_rp_f:
3500 case Intrinsic::nvvm_mul_rz_f:
3501 case Intrinsic::nvvm_mul_rm_d:
3502 case Intrinsic::nvvm_mul_rn_d:
3503 case Intrinsic::nvvm_mul_rp_d:
3504 case Intrinsic::nvvm_mul_rz_d:
3505 case Intrinsic::nvvm_mul_rm_ftz_f:
3506 case Intrinsic::nvvm_mul_rn_ftz_f:
3507 case Intrinsic::nvvm_mul_rp_ftz_f:
3508 case Intrinsic::nvvm_mul_rz_ftz_f: {
3509
3510 bool IsFTZ = nvvm::FMulShouldFTZ(IntrinsicID);
3511 APFloat A = IsFTZ ? FTZPreserveSign(Op1V) : Op1V;
3512 APFloat B = IsFTZ ? FTZPreserveSign(Op2V) : Op2V;
3513
3514 APFloat::roundingMode RoundMode =
3515 nvvm::GetFMulRoundingMode(IntrinsicID);
3516
3517 APFloat Res = A;
3518 APFloat::opStatus Status = Res.multiply(B, RoundMode);
3519
3520 if (!Res.isNaN() &&
3521 (Status == APFloat::opOK || Status == APFloat::opInexact)) {
3522 Res = IsFTZ ? FTZPreserveSign(Res) : Res;
3523 return ConstantFP::get(Ty, Res);
3524 }
3525 return nullptr;
3526 }
3527
3528 case Intrinsic::nvvm_div_rm_f:
3529 case Intrinsic::nvvm_div_rn_f:
3530 case Intrinsic::nvvm_div_rp_f:
3531 case Intrinsic::nvvm_div_rz_f:
3532 case Intrinsic::nvvm_div_rm_d:
3533 case Intrinsic::nvvm_div_rn_d:
3534 case Intrinsic::nvvm_div_rp_d:
3535 case Intrinsic::nvvm_div_rz_d:
3536 case Intrinsic::nvvm_div_rm_ftz_f:
3537 case Intrinsic::nvvm_div_rn_ftz_f:
3538 case Intrinsic::nvvm_div_rp_ftz_f:
3539 case Intrinsic::nvvm_div_rz_ftz_f: {
3540 bool IsFTZ = nvvm::FDivShouldFTZ(IntrinsicID);
3541 APFloat A = IsFTZ ? FTZPreserveSign(Op1V) : Op1V;
3542 APFloat B = IsFTZ ? FTZPreserveSign(Op2V) : Op2V;
3543 APFloat::roundingMode RoundMode =
3544 nvvm::GetFDivRoundingMode(IntrinsicID);
3545
3546 APFloat Res = A;
3547 APFloat::opStatus Status = Res.divide(B, RoundMode);
3548 if (!Res.isNaN() &&
3549 (Status == APFloat::opOK || Status == APFloat::opInexact)) {
3550 Res = IsFTZ ? FTZPreserveSign(Res) : Res;
3551 return ConstantFP::get(Ty, Res);
3552 }
3553 return nullptr;
3554 }
3555 }
3556
3557 if (!Ty->isHalfTy() && !Ty->isFloatTy() && !Ty->isDoubleTy())
3558 return nullptr;
3559
3560 switch (IntrinsicID) {
3561 default:
3562 break;
3563 case Intrinsic::pow:
3564 return ConstantFoldBinaryFP(pow, Op1V, Op2V, Ty);
3565 case Intrinsic::amdgcn_fmul_legacy:
3566 // The legacy behaviour is that multiplying +/- 0.0 by anything, even
3567 // NaN or infinity, gives +0.0.
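// For example, fmul.legacy(+0.0, NaN) folds to +0.0 rather than NaN.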
3568 if (Op1V.isZero() || Op2V.isZero())
3569 return ConstantFP::getZero(Ty);
3570 return ConstantFP::get(Ty, Op1V * Op2V);
3571 }
3572
3573 } else if (auto *Op2C = dyn_cast<ConstantInt>(Operands[1])) {
3574 switch (IntrinsicID) {
3575 case Intrinsic::ldexp: {
3576 return ConstantFP::get(
3577 Ty->getContext(),
3578 scalbn(Op1V, Op2C->getSExtValue(), APFloat::rmNearestTiesToEven));
3579 }
3580 case Intrinsic::is_fpclass: {
3581 FPClassTest Mask = static_cast<FPClassTest>(Op2C->getZExtValue());
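// Each mask bit tests one class; e.g. is.fpclass(-0.0, fcZero) folds to
// true because fcZero == fcNegZero | fcPosZero covers both signed zeros.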
3582 bool Result =
3583 ((Mask & fcSNan) && Op1V.isNaN() && Op1V.isSignaling()) ||
3584 ((Mask & fcQNan) && Op1V.isNaN() && !Op1V.isSignaling()) ||
3585 ((Mask & fcNegInf) && Op1V.isNegInfinity()) ||
3586 ((Mask & fcNegNormal) && Op1V.isNormal() && Op1V.isNegative()) ||
3587 ((Mask & fcNegSubnormal) && Op1V.isDenormal() && Op1V.isNegative()) ||
3588 ((Mask & fcNegZero) && Op1V.isZero() && Op1V.isNegative()) ||
3589 ((Mask & fcPosZero) && Op1V.isZero() && !Op1V.isNegative()) ||
3590 ((Mask & fcPosSubnormal) && Op1V.isDenormal() && !Op1V.isNegative()) ||
3591 ((Mask & fcPosNormal) && Op1V.isNormal() && !Op1V.isNegative()) ||
3592 ((Mask & fcPosInf) && Op1V.isPosInfinity());
3593 return ConstantInt::get(Ty, Result);
3594 }
3595 case Intrinsic::powi: {
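// powi is folded via the host std::pow(); e.g. powi(2.0, 10) folds to 1024.0.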
3596 int Exp = static_cast<int>(Op2C->getSExtValue());
3597 switch (Ty->getTypeID()) {
3598 case Type::HalfTyID:
3599 case Type::FloatTyID: {
3600 APFloat Res(static_cast<float>(std::pow(Op1V.convertToFloat(), Exp)));
3601 if (Ty->isHalfTy()) {
3602 bool Unused;
3603 Res.convert(APFloat::IEEEhalf(), APFloat::rmNearestTiesToEven,
3604 &Unused);
3605 }
3606 return ConstantFP::get(Ty, Res);
3607 }
3608 case Type::DoubleTyID:
3609 return ConstantFP::get(Ty, std::pow(Op1V.convertToDouble(), Exp));
3610 default:
3611 return nullptr;
3612 }
3613 }
3614 default:
3615 break;
3616 }
3617 }
3618 return nullptr;
3619 }
3620
3621 if (Operands[0]->getType()->isIntegerTy() &&
3622 Operands[1]->getType()->isIntegerTy()) {
3623 const APInt *C0, *C1;
3624 if (!getConstIntOrUndef(Operands[0], C0) ||
3625 !getConstIntOrUndef(Operands[1], C1))
3626 return nullptr;
3627
3628 switch (IntrinsicID) {
3629 default: break;
3630 case Intrinsic::smax:
3631 case Intrinsic::smin:
3632 case Intrinsic::umax:
3633 case Intrinsic::umin:
3634 if (!C0 && !C1)
3635 return UndefValue::get(Ty);
3636 if (!C0 || !C1)
3637 return MinMaxIntrinsic::getSaturationPoint(IntrinsicID, Ty);
3638 return ConstantInt::get(
3639 Ty, ICmpInst::compare(*C0, *C1,
3640 MinMaxIntrinsic::getPredicate(IntrinsicID))
3641 ? *C0
3642 : *C1);
3643
3644 case Intrinsic::scmp:
3645 case Intrinsic::ucmp:
3646 if (!C0 || !C1)
3647 return ConstantInt::get(Ty, 0);
3648
3649 int Res;
3650 if (IntrinsicID == Intrinsic::scmp)
3651 Res = C0->sgt(*C1) ? 1 : C0->slt(*C1) ? -1 : 0;
3652 else
3653 Res = C0->ugt(*C1) ? 1 : C0->ult(*C1) ? -1 : 0;
3654 return ConstantInt::get(Ty, Res, /*IsSigned=*/true);
3655
3656 case Intrinsic::usub_with_overflow:
3657 case Intrinsic::ssub_with_overflow:
3658 // X - undef -> { 0, false }
3659 // undef - X -> { 0, false }
3660 if (!C0 || !C1)
3661 return Constant::getNullValue(Ty);
3662 [[fallthrough]];
3663 case Intrinsic::uadd_with_overflow:
3664 case Intrinsic::sadd_with_overflow:
3665 // X + undef -> { -1, false }
3666 // undef + x -> { -1, false }
3667 if (!C0 || !C1) {
3668 return ConstantStruct::get(
3669 cast<StructType>(Ty),
3670 {Constant::getAllOnesValue(Ty->getStructElementType(0)),
3671 Constant::getNullValue(Ty->getStructElementType(1))});
3672 }
3673 [[fallthrough]];
3674 case Intrinsic::smul_with_overflow:
3675 case Intrinsic::umul_with_overflow: {
3676 // undef * X -> { 0, false }
3677 // X * undef -> { 0, false }
3678 if (!C0 || !C1)
3679 return Constant::getNullValue(Ty);
3680
3681 APInt Res;
3682 bool Overflow;
3683 switch (IntrinsicID) {
3684 default: llvm_unreachable("Invalid case");
3685 case Intrinsic::sadd_with_overflow:
3686 Res = C0->sadd_ov(*C1, Overflow);
3687 break;
3688 case Intrinsic::uadd_with_overflow:
3689 Res = C0->uadd_ov(*C1, Overflow);
3690 break;
3691 case Intrinsic::ssub_with_overflow:
3692 Res = C0->ssub_ov(*C1, Overflow);
3693 break;
3694 case Intrinsic::usub_with_overflow:
3695 Res = C0->usub_ov(*C1, Overflow);
3696 break;
3697 case Intrinsic::smul_with_overflow:
3698 Res = C0->smul_ov(*C1, Overflow);
3699 break;
3700 case Intrinsic::umul_with_overflow:
3701 Res = C0->umul_ov(*C1, Overflow);
3702 break;
3703 }
3704 Constant *Ops[] = {
3705 ConstantInt::get(Ty->getContext(), Res),
3706 ConstantInt::get(Type::getInt1Ty(Ty->getContext()), Overflow)
3707 };
3708 return ConstantStruct::get(cast<StructType>(Ty), Ops);
3709 }
3710 case Intrinsic::uadd_sat:
3711 case Intrinsic::sadd_sat:
3712 if (!C0 && !C1)
3713 return UndefValue::get(Ty);
3714 if (!C0 || !C1)
3715 return Constant::getAllOnesValue(Ty);
3716 if (IntrinsicID == Intrinsic::uadd_sat)
3717 return ConstantInt::get(Ty, C0->uadd_sat(*C1));
3718 else
3719 return ConstantInt::get(Ty, C0->sadd_sat(*C1));
3720 case Intrinsic::usub_sat:
3721 case Intrinsic::ssub_sat:
3722 if (!C0 && !C1)
3723 return UndefValue::get(Ty);
3724 if (!C0 || !C1)
3725 return Constant::getNullValue(Ty);
3726 if (IntrinsicID == Intrinsic::usub_sat)
3727 return ConstantInt::get(Ty, C0->usub_sat(*C1));
3728 else
3729 return ConstantInt::get(Ty, C0->ssub_sat(*C1));
3730 case Intrinsic::cttz:
3731 case Intrinsic::ctlz:
3732 assert(C1 && "Must be constant int");
3733
3734 // cttz(0, 1) and ctlz(0, 1) are poison.
3735 if (C1->isOne() && (!C0 || C0->isZero()))
3736 return PoisonValue::get(Ty);
3737 if (!C0)
3738 return Constant::getNullValue(Ty);
3739 if (IntrinsicID == Intrinsic::cttz)
3740 return ConstantInt::get(Ty, C0->countr_zero());
3741 else
3742 return ConstantInt::get(Ty, C0->countl_zero());
3743
3744 case Intrinsic::abs:
3745 assert(C1 && "Must be constant int");
3746 assert((C1->isOne() || C1->isZero()) && "Must be 0 or 1");
3747
3748 // Undef or minimum val operand with poison min --> poison
3749 if (C1->isOne() && (!C0 || C0->isMinSignedValue()))
3750 return PoisonValue::get(Ty);
3751
3752 // Undef operand with no poison min --> 0 (sign bit must be clear)
3753 if (!C0)
3754 return Constant::getNullValue(Ty);
3755
3756 return ConstantInt::get(Ty, C0->abs());
3757 case Intrinsic::amdgcn_wave_reduce_umin:
3758 case Intrinsic::amdgcn_wave_reduce_umax:
3759 case Intrinsic::amdgcn_wave_reduce_max:
3760 case Intrinsic::amdgcn_wave_reduce_min:
3761 case Intrinsic::amdgcn_wave_reduce_add:
3762 case Intrinsic::amdgcn_wave_reduce_sub:
3763 case Intrinsic::amdgcn_wave_reduce_and:
3764 case Intrinsic::amdgcn_wave_reduce_or:
3765 case Intrinsic::amdgcn_wave_reduce_xor:
3766 return dyn_cast<Constant>(Operands[0]);
3767 }
3768
3769 return nullptr;
3770 }
3771
3772 // Support ConstantVector in case we have an Undef at the top.
3773 if ((isa<ConstantVector>(Operands[0]) ||
3774 isa<ConstantDataVector>(Operands[0])) &&
3775 // Check for default rounding mode.
3776 // FIXME: Support other rounding modes?
3777 isa<ConstantInt>(Operands[1]) &&
3778 cast<ConstantInt>(Operands[1])->getValue() == 4) {
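// A rounding-mode operand of 4 is _MM_FROUND_CUR_DIRECTION, i.e. use the
// current MXCSR rounding mode.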
3779 auto *Op = cast<Constant>(Operands[0]);
3780 switch (IntrinsicID) {
3781 default: break;
3782 case Intrinsic::x86_avx512_vcvtss2si32:
3783 case Intrinsic::x86_avx512_vcvtss2si64:
3784 case Intrinsic::x86_avx512_vcvtsd2si32:
3785 case Intrinsic::x86_avx512_vcvtsd2si64:
3786 if (ConstantFP *FPOp =
3787 dyn_cast_or_null<ConstantFP>(Op->getAggregateElement(0U)))
3788 return ConstantFoldSSEConvertToInt(FPOp->getValueAPF(),
3789 /*roundTowardZero=*/false, Ty,
3790 /*IsSigned*/true);
3791 break;
3792 case Intrinsic::x86_avx512_vcvtss2usi32:
3793 case Intrinsic::x86_avx512_vcvtss2usi64:
3794 case Intrinsic::x86_avx512_vcvtsd2usi32:
3795 case Intrinsic::x86_avx512_vcvtsd2usi64:
3796 if (ConstantFP *FPOp =
3797 dyn_cast_or_null<ConstantFP>(Op->getAggregateElement(0U)))
3798 return ConstantFoldSSEConvertToInt(FPOp->getValueAPF(),
3799 /*roundTowardZero=*/false, Ty,
3800 /*IsSigned*/false);
3801 break;
3802 case Intrinsic::x86_avx512_cvttss2si:
3803 case Intrinsic::x86_avx512_cvttss2si64:
3804 case Intrinsic::x86_avx512_cvttsd2si:
3805 case Intrinsic::x86_avx512_cvttsd2si64:
3806 if (ConstantFP *FPOp =
3807 dyn_cast_or_null<ConstantFP>(Op->getAggregateElement(0U)))
3808 return ConstantFoldSSEConvertToInt(FPOp->getValueAPF(),
3809 /*roundTowardZero=*/true, Ty,
3810 /*IsSigned*/true);
3811 break;
3812 case Intrinsic::x86_avx512_cvttss2usi:
3813 case Intrinsic::x86_avx512_cvttss2usi64:
3814 case Intrinsic::x86_avx512_cvttsd2usi:
3815 case Intrinsic::x86_avx512_cvttsd2usi64:
3816 if (ConstantFP *FPOp =
3817 dyn_cast_or_null<ConstantFP>(Op->getAggregateElement(0U)))
3818 return ConstantFoldSSEConvertToInt(FPOp->getValueAPF(),
3819 /*roundTowardZero=*/true, Ty,
3820 /*IsSigned*/false);
3821 break;
3822 }
3823 }
3824 return nullptr;
3825}
3826
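// Fold the amdgcn cube intrinsics: pick the major axis (the input with the
// largest magnitude) and derive the cube face id (cubeid), the s/t face
// coordinates (cubesc/cubetc) and twice the major axis (cubema).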
3827static APFloat ConstantFoldAMDGCNCubeIntrinsic(Intrinsic::ID IntrinsicID,
3828 const APFloat &S0,
3829 const APFloat &S1,
3830 const APFloat &S2) {
3831 unsigned ID;
3832 const fltSemantics &Sem = S0.getSemantics();
3833 APFloat MA(Sem), SC(Sem), TC(Sem);
3834 if (abs(S2) >= abs(S0) && abs(S2) >= abs(S1)) {
3835 if (S2.isNegative() && S2.isNonZero() && !S2.isNaN()) {
3836 // S2 < 0
3837 ID = 5;
3838 SC = -S0;
3839 } else {
3840 ID = 4;
3841 SC = S0;
3842 }
3843 MA = S2;
3844 TC = -S1;
3845 } else if (abs(S1) >= abs(S0)) {
3846 if (S1.isNegative() && S1.isNonZero() && !S1.isNaN()) {
3847 // S1 < 0
3848 ID = 3;
3849 TC = -S2;
3850 } else {
3851 ID = 2;
3852 TC = S2;
3853 }
3854 MA = S1;
3855 SC = S0;
3856 } else {
3857 if (S0.isNegative() && S0.isNonZero() && !S0.isNaN()) {
3858 // S0 < 0
3859 ID = 1;
3860 SC = S2;
3861 } else {
3862 ID = 0;
3863 SC = -S2;
3864 }
3865 MA = S0;
3866 TC = -S1;
3867 }
3868 switch (IntrinsicID) {
3869 default:
3870 llvm_unreachable("unhandled amdgcn cube intrinsic");
3871 case Intrinsic::amdgcn_cubeid:
3872 return APFloat(Sem, ID);
3873 case Intrinsic::amdgcn_cubema:
3874 return MA + MA;
3875 case Intrinsic::amdgcn_cubesc:
3876 return SC;
3877 case Intrinsic::amdgcn_cubetc:
3878 return TC;
3879 }
3880}
3881
3882static Constant *ConstantFoldAMDGCNPermIntrinsic(ArrayRef<Constant *> Operands,
3883 Type *Ty) {
3884 const APInt *C0, *C1, *C2;
3885 if (!getConstIntOrUndef(Operands[0], C0) ||
3886 !getConstIntOrUndef(Operands[1], C1) ||
3887 !getConstIntOrUndef(Operands[2], C2))
3888 return nullptr;
3889
3890 if (!C2)
3891 return UndefValue::get(Ty);
3892
3893 APInt Val(32, 0);
3894 unsigned NumUndefBytes = 0;
3895 for (unsigned I = 0; I < 32; I += 8) {
3896 unsigned Sel = C2->extractBitsAsZExtValue(8, I);
3897 unsigned B = 0;
3898
3899 if (Sel >= 13)
3900 B = 0xff;
3901 else if (Sel == 12)
3902 B = 0x00;
3903 else {
3904 const APInt *Src = ((Sel & 10) == 10 || (Sel & 12) == 4) ? C0 : C1;
3905 if (!Src)
3906 ++NumUndefBytes;
3907 else if (Sel < 8)
3908 B = Src->extractBitsAsZExtValue(8, (Sel & 3) * 8);
3909 else
3910 B = Src->extractBitsAsZExtValue(1, (Sel & 1) ? 31 : 15) * 0xff;
3911 }
3912
3913 Val.insertBits(B, I, 8);
3914 }
3915
3916 if (NumUndefBytes == 4)
3917 return UndefValue::get(Ty);
3918
3919 return ConstantInt::get(Ty, Val);
3920}
3921
3922static Constant *ConstantFoldScalarCall3(StringRef Name,
3923 Intrinsic::ID IntrinsicID,
3924 Type *Ty,
3925 ArrayRef<Constant *> Operands,
3926 const TargetLibraryInfo *TLI,
3927 const CallBase *Call) {
3928 assert(Operands.size() == 3 && "Wrong number of operands.");
3929
3930 if (const auto *Op1 = dyn_cast<ConstantFP>(Operands[0])) {
3931 if (const auto *Op2 = dyn_cast<ConstantFP>(Operands[1])) {
3932 if (const auto *Op3 = dyn_cast<ConstantFP>(Operands[2])) {
3933 const APFloat &C1 = Op1->getValueAPF();
3934 const APFloat &C2 = Op2->getValueAPF();
3935 const APFloat &C3 = Op3->getValueAPF();
3936
3937 if (const auto *ConstrIntr = dyn_cast<ConstrainedFPIntrinsic>(Call)) {
3938 RoundingMode RM = getEvaluationRoundingMode(ConstrIntr);
3939 APFloat Res = C1;
3940 APFloat::opStatus St;
3941 switch (IntrinsicID) {
3942 default:
3943 return nullptr;
3944 case Intrinsic::experimental_constrained_fma:
3945 case Intrinsic::experimental_constrained_fmuladd:
3946 St = Res.fusedMultiplyAdd(C2, C3, RM);
3947 break;
3948 }
3949 if (mayFoldConstrained(
3950 const_cast<ConstrainedFPIntrinsic *>(ConstrIntr), St))
3951 return ConstantFP::get(Ty, Res);
3952 return nullptr;
3953 }
3954
3955 switch (IntrinsicID) {
3956 default: break;
3957 case Intrinsic::amdgcn_fma_legacy: {
3958 // The legacy behaviour is that multiplying +/- 0.0 by anything, even
3959 // NaN or infinity, gives +0.0.
3960 if (C1.isZero() || C2.isZero()) {
3961 // It's tempting to just return C3 here, but that would give the
3962 // wrong result if C3 was -0.0.
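// For example, fma.legacy(+0.0, NaN, -0.0) folds to +0.0 + -0.0 == +0.0,
// whereas returning C3 directly would give -0.0.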
3963 return ConstantFP::get(Ty, APFloat(0.0f) + C3);
3964 }
3965 [[fallthrough]];
3966 }
3967 case Intrinsic::fma:
3968 case Intrinsic::fmuladd: {
3969 APFloat V = C1;
3970 V.fusedMultiplyAdd(C2, C3, APFloat::rmNearestTiesToEven);
3971 return ConstantFP::get(Ty, V);
3972 }
3973
3974 case Intrinsic::nvvm_fma_rm_f:
3975 case Intrinsic::nvvm_fma_rn_f:
3976 case Intrinsic::nvvm_fma_rp_f:
3977 case Intrinsic::nvvm_fma_rz_f:
3978 case Intrinsic::nvvm_fma_rm_d:
3979 case Intrinsic::nvvm_fma_rn_d:
3980 case Intrinsic::nvvm_fma_rp_d:
3981 case Intrinsic::nvvm_fma_rz_d:
3982 case Intrinsic::nvvm_fma_rm_ftz_f:
3983 case Intrinsic::nvvm_fma_rn_ftz_f:
3984 case Intrinsic::nvvm_fma_rp_ftz_f:
3985 case Intrinsic::nvvm_fma_rz_ftz_f: {
3986 bool IsFTZ = nvvm::FMAShouldFTZ(IntrinsicID);
3987 APFloat A = IsFTZ ? FTZPreserveSign(C1) : C1;
3988 APFloat B = IsFTZ ? FTZPreserveSign(C2) : C2;
3989 APFloat C = IsFTZ ? FTZPreserveSign(C3) : C3;
3990
3991 APFloat::roundingMode RoundMode =
3992 nvvm::GetFMARoundingMode(IntrinsicID);
3993
3994 APFloat Res = A;
3995 APFloat::opStatus Status = Res.fusedMultiplyAdd(B, C, RoundMode);
3996
3997 if (!Res.isNaN() &&
3998 (Status == APFloat::opOK || Status == APFloat::opInexact)) {
3999 Res = IsFTZ ? FTZPreserveSign(Res) : Res;
4000 return ConstantFP::get(Ty, Res);
4001 }
4002 return nullptr;
4003 }
4004
4005 case Intrinsic::amdgcn_cubeid:
4006 case Intrinsic::amdgcn_cubema:
4007 case Intrinsic::amdgcn_cubesc:
4008 case Intrinsic::amdgcn_cubetc: {
4009 APFloat V = ConstantFoldAMDGCNCubeIntrinsic(IntrinsicID, C1, C2, C3);
4010 return ConstantFP::get(Ty, V);
4011 }
4012 }
4013 }
4014 }
4015 }
4016
4017 if (IntrinsicID == Intrinsic::smul_fix ||
4018 IntrinsicID == Intrinsic::smul_fix_sat) {
4019 const APInt *C0, *C1;
4020 if (!getConstIntOrUndef(Operands[0], C0) ||
4021 !getConstIntOrUndef(Operands[1], C1))
4022 return nullptr;
4023
4024 // undef * C -> 0
4025 // C * undef -> 0
4026 if (!C0 || !C1)
4027 return Constant::getNullValue(Ty);
4028
4029 // This code performs rounding towards negative infinity in case the result
4030 // cannot be represented exactly for the given scale. Targets that do care
4031 // about rounding should use a target hook for specifying how rounding
4032 // should be done, and provide their own folding to be consistent with
4033 // rounding. This is the same approach as used by
4034 // DAGTypeLegalizer::ExpandIntRes_MULFIX.
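// For example, with a scale of 1, smul.fix(i32 3, i32 3, i32 1) folds to
// (3 * 3) >> 1 = 4, i.e. 1.5 * 1.5 == 2.25 rounded down to 2.0.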
4035 unsigned Scale = cast<ConstantInt>(Operands[2])->getZExtValue();
4036 unsigned Width = C0->getBitWidth();
4037 assert(Scale < Width && "Illegal scale.");
4038 unsigned ExtendedWidth = Width * 2;
4039 APInt Product =
4040 (C0->sext(ExtendedWidth) * C1->sext(ExtendedWidth)).ashr(Scale);
4041 if (IntrinsicID == Intrinsic::smul_fix_sat) {
4042 APInt Max = APInt::getSignedMaxValue(Width).sext(ExtendedWidth);
4043 APInt Min = APInt::getSignedMinValue(Width).sext(ExtendedWidth);
4044 Product = APIntOps::smin(Product, Max);
4045 Product = APIntOps::smax(Product, Min);
4046 }
4047 return ConstantInt::get(Ty->getContext(), Product.sextOrTrunc(Width));
4048 }
4049
4050 if (IntrinsicID == Intrinsic::fshl || IntrinsicID == Intrinsic::fshr) {
4051 const APInt *C0, *C1, *C2;
4052 if (!getConstIntOrUndef(Operands[0], C0) ||
4053 !getConstIntOrUndef(Operands[1], C1) ||
4054 !getConstIntOrUndef(Operands[2], C2))
4055 return nullptr;
4056
4057 bool IsRight = IntrinsicID == Intrinsic::fshr;
4058 if (!C2)
4059 return Operands[IsRight ? 1 : 0];
4060 if (!C0 && !C1)
4061 return UndefValue::get(Ty);
4062
4063 // The shift amount is interpreted as modulo the bitwidth. If the shift
4064 // amount is effectively 0, avoid UB due to oversized inverse shift below.
4065 unsigned BitWidth = C2->getBitWidth();
4066 unsigned ShAmt = C2->urem(BitWidth);
4067 if (!ShAmt)
4068 return Operands[IsRight ? 1 : 0];
4069
4070 // (C0 << ShlAmt) | (C1 >> LshrAmt)
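// For example, fshl(i8 0x12, i8 0x34, i8 4) folds to
// (0x12 << 4) | (0x34 >> 4) == 0x23.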
4071 unsigned LshrAmt = IsRight ? ShAmt : BitWidth - ShAmt;
4072 unsigned ShlAmt = !IsRight ? ShAmt : BitWidth - ShAmt;
4073 if (!C0)
4074 return ConstantInt::get(Ty, C1->lshr(LshrAmt));
4075 if (!C1)
4076 return ConstantInt::get(Ty, C0->shl(ShlAmt));
4077 return ConstantInt::get(Ty, C0->shl(ShlAmt) | C1->lshr(LshrAmt));
4078 }
4079
4080 if (IntrinsicID == Intrinsic::amdgcn_perm)
4081 return ConstantFoldAMDGCNPermIntrinsic(Operands, Ty);
4082
4083 return nullptr;
4084}
4085
4086static Constant *ConstantFoldScalarCall(StringRef Name,
4087 Intrinsic::ID IntrinsicID,
4088 Type *Ty,
4089 ArrayRef<Constant *> Operands,
4090 const TargetLibraryInfo *TLI,
4091 const CallBase *Call) {
4092 if (IntrinsicID != Intrinsic::not_intrinsic &&
4093 any_of(Operands, IsaPred<PoisonValue>) &&
4094 intrinsicPropagatesPoison(IntrinsicID))
4095 return PoisonValue::get(Ty);
4096
4097 if (Operands.size() == 1)
4098 return ConstantFoldScalarCall1(Name, IntrinsicID, Ty, Operands, TLI, Call);
4099
4100 if (Operands.size() == 2) {
4101 if (Constant *FoldedLibCall =
4102 ConstantFoldLibCall2(Name, Ty, Operands, TLI)) {
4103 return FoldedLibCall;
4104 }
4105 return ConstantFoldIntrinsicCall2(IntrinsicID, Ty, Operands, Call);
4106 }
4107
4108 if (Operands.size() == 3)
4109 return ConstantFoldScalarCall3(Name, IntrinsicID, Ty, Operands, TLI, Call);
4110
4111 return nullptr;
4112}
4113
4114static Constant *ConstantFoldFixedVectorCall(
4115 StringRef Name, Intrinsic::ID IntrinsicID, FixedVectorType *FVTy,
4116 ArrayRef<Constant *> Operands, const DataLayout &DL,
4117 const TargetLibraryInfo *TLI, const CallBase *Call) {
4118 SmallVector<Constant *, 4> Result(FVTy->getNumElements());
4119 SmallVector<Constant *, 4> Lane(Operands.size());
4120 Type *Ty = FVTy->getElementType();
4121
4122 switch (IntrinsicID) {
4123 case Intrinsic::masked_load: {
4124 auto *SrcPtr = Operands[0];
4125 auto *Mask = Operands[1];
4126 auto *Passthru = Operands[2];
4127
4128 Constant *VecData = ConstantFoldLoadFromConstPtr(SrcPtr, FVTy, DL);
4129
4130 SmallVector<Constant *, 32> NewElements;
4131 for (unsigned I = 0, E = FVTy->getNumElements(); I != E; ++I) {
4132 auto *MaskElt = Mask->getAggregateElement(I);
4133 if (!MaskElt)
4134 break;
4135 auto *PassthruElt = Passthru->getAggregateElement(I);
4136 auto *VecElt = VecData ? VecData->getAggregateElement(I) : nullptr;
4137 if (isa<UndefValue>(MaskElt)) {
4138 if (PassthruElt)
4139 NewElements.push_back(PassthruElt);
4140 else if (VecElt)
4141 NewElements.push_back(VecElt);
4142 else
4143 return nullptr;
4144 }
4145 if (MaskElt->isNullValue()) {
4146 if (!PassthruElt)
4147 return nullptr;
4148 NewElements.push_back(PassthruElt);
4149 } else if (MaskElt->isOneValue()) {
4150 if (!VecElt)
4151 return nullptr;
4152 NewElements.push_back(VecElt);
4153 } else {
4154 return nullptr;
4155 }
4156 }
4157 if (NewElements.size() != FVTy->getNumElements())
4158 return nullptr;
4159 return ConstantVector::get(NewElements);
4160 }
4161 case Intrinsic::arm_mve_vctp8:
4162 case Intrinsic::arm_mve_vctp16:
4163 case Intrinsic::arm_mve_vctp32:
4164 case Intrinsic::arm_mve_vctp64: {
4165 if (auto *Op = dyn_cast<ConstantInt>(Operands[0])) {
4166 unsigned Lanes = FVTy->getNumElements();
4167 uint64_t Limit = Op->getZExtValue();
4168
4169 SmallVector<Constant *, 16> NCs;
4170 for (unsigned i = 0; i < Lanes; i++) {
4171 if (i < Limit)
4172 NCs.push_back(ConstantInt::getTrue(Ty));
4173 else
4174 NCs.push_back(ConstantInt::getFalse(Ty));
4175 }
4176 return ConstantVector::get(NCs);
4177 }
4178 return nullptr;
4179 }
4180 case Intrinsic::get_active_lane_mask: {
4181 auto *Op0 = dyn_cast<ConstantInt>(Operands[0]);
4182 auto *Op1 = dyn_cast<ConstantInt>(Operands[1]);
4183 if (Op0 && Op1) {
4184 unsigned Lanes = FVTy->getNumElements();
4185 uint64_t Base = Op0->getZExtValue();
4186 uint64_t Limit = Op1->getZExtValue();
4187
4188 SmallVector<Constant *, 16> NCs;
4189 for (unsigned i = 0; i < Lanes; i++) {
4190 if (Base + i < Limit)
4191 NCs.push_back(ConstantInt::getTrue(Ty));
4192 else
4193 NCs.push_back(ConstantInt::getFalse(Ty));
4194 }
4195 return ConstantVector::get(NCs);
4196 }
4197 return nullptr;
4198 }
4199 case Intrinsic::vector_extract: {
4200 auto *Idx = dyn_cast<ConstantInt>(Operands[1]);
4201 Constant *Vec = Operands[0];
4202 if (!Idx || !isa<FixedVectorType>(Vec->getType()))
4203 return nullptr;
4204
4205 unsigned NumElements = FVTy->getNumElements();
4206 unsigned VecNumElements =
4207 cast<FixedVectorType>(Vec->getType())->getNumElements();
4208 unsigned StartingIndex = Idx->getZExtValue();
4209
4210 // Extracting the entire vector is a nop.
4211 if (NumElements == VecNumElements && StartingIndex == 0)
4212 return Vec;
4213
4214 for (unsigned I = StartingIndex, E = StartingIndex + NumElements; I < E;
4215 ++I) {
4216 Constant *Elt = Vec->getAggregateElement(I);
4217 if (!Elt)
4218 return nullptr;
4219 Result[I - StartingIndex] = Elt;
4220 }
4221
4222 return ConstantVector::get(Result);
4223 }
4224 case Intrinsic::vector_insert: {
4225 Constant *Vec = Operands[0];
4226 Constant *SubVec = Operands[1];
4227 auto *Idx = dyn_cast<ConstantInt>(Operands[2]);
4228 if (!Idx || !isa<FixedVectorType>(Vec->getType()))
4229 return nullptr;
4230
4231 unsigned SubVecNumElements =
4232 cast<FixedVectorType>(SubVec->getType())->getNumElements();
4233 unsigned VecNumElements =
4234 cast<FixedVectorType>(Vec->getType())->getNumElements();
4235 unsigned IdxN = Idx->getZExtValue();
4236 // Replacing the entire vector with a subvec is a nop.
4237 if (SubVecNumElements == VecNumElements && IdxN == 0)
4238 return SubVec;
4239
4240 for (unsigned I = 0; I < VecNumElements; ++I) {
4241 Constant *Elt;
4242 if (I < IdxN + SubVecNumElements)
4243 Elt = SubVec->getAggregateElement(I - IdxN);
4244 else
4245 Elt = Vec->getAggregateElement(I);
4246 if (!Elt)
4247 return nullptr;
4248 Result[I] = Elt;
4249 }
4250 return ConstantVector::get(Result);
4251 }
4252 case Intrinsic::vector_interleave2:
4253 case Intrinsic::vector_interleave3:
4254 case Intrinsic::vector_interleave4:
4255 case Intrinsic::vector_interleave5:
4256 case Intrinsic::vector_interleave6:
4257 case Intrinsic::vector_interleave7:
4258 case Intrinsic::vector_interleave8: {
4259 unsigned NumElements =
4260 cast<FixedVectorType>(Operands[0]->getType())->getNumElements();
4261 unsigned NumOperands = Operands.size();
4262 for (unsigned I = 0; I < NumElements; ++I) {
4263 for (unsigned J = 0; J < NumOperands; ++J) {
4264 Constant *Elt = Operands[J]->getAggregateElement(I);
4265 if (!Elt)
4266 return nullptr;
4267 Result[NumOperands * I + J] = Elt;
4268 }
4269 }
4270 return ConstantVector::get(Result);
4271 }
4272 case Intrinsic::wasm_dot: {
4273 unsigned NumElements =
4274 cast<FixedVectorType>(Operands[0]->getType())->getNumElements();
4275
4276 assert(NumElements == 8 && Result.size() == 4 &&
4277 "wasm dot takes i16x8 and produces i32x4");
4278 assert(Ty->isIntegerTy());
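// Each i32 result lane is the sum of two adjacent i16 products:
// Result[I] = a[2*I] * b[2*I] + a[2*I+1] * b[2*I+1].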
4279 int32_t MulVector[8];
4280
4281 for (unsigned I = 0; I < NumElements; ++I) {
4282 ConstantInt *Elt0 =
4283 cast<ConstantInt>(Operands[0]->getAggregateElement(I));
4284 ConstantInt *Elt1 =
4285 cast<ConstantInt>(Operands[1]->getAggregateElement(I));
4286
4287 MulVector[I] = Elt0->getSExtValue() * Elt1->getSExtValue();
4288 }
4289 for (unsigned I = 0; I < Result.size(); I++) {
4290 int64_t IAdd = (int64_t)MulVector[I * 2] + (int64_t)MulVector[I * 2 + 1];
4291 Result[I] = ConstantInt::get(Ty, IAdd);
4292 }
4293
4294 return ConstantVector::get(Result);
4295 }
4296 default:
4297 break;
4298 }
4299
4300 for (unsigned I = 0, E = FVTy->getNumElements(); I != E; ++I) {
4301 // Gather a column of constants.
4302 for (unsigned J = 0, JE = Operands.size(); J != JE; ++J) {
4303 // Some intrinsics use a scalar type for certain arguments.
4304 if (isVectorIntrinsicWithScalarOpAtArg(IntrinsicID, J, /*TTI=*/nullptr)) {
4305 Lane[J] = Operands[J];
4306 continue;
4307 }
4308
4309 Constant *Agg = Operands[J]->getAggregateElement(I);
4310 if (!Agg)
4311 return nullptr;
4312
4313 Lane[J] = Agg;
4314 }
4315
4316 // Use the regular scalar folding to simplify this column.
4317 Constant *Folded =
4318 ConstantFoldScalarCall(Name, IntrinsicID, Ty, Lane, TLI, Call);
4319 if (!Folded)
4320 return nullptr;
4321 Result[I] = Folded;
4322 }
4323
4324 return ConstantVector::get(Result);
4325}
4326
4327static Constant *ConstantFoldScalableVectorCall(
4328 StringRef Name, Intrinsic::ID IntrinsicID, ScalableVectorType *SVTy,
4329 ArrayRef<Constant *> Operands, const DataLayout &DL,
4330 const TargetLibraryInfo *TLI, const CallBase *Call) {
4331 switch (IntrinsicID) {
4332 case Intrinsic::aarch64_sve_convert_from_svbool: {
4333 auto *Src = dyn_cast<Constant>(Operands[0]);
4334 if (!Src || !Src->isNullValue())
4335 break;
4336
4337 return ConstantInt::getFalse(SVTy);
4338 }
4339 case Intrinsic::get_active_lane_mask: {
4340 auto *Op0 = dyn_cast<ConstantInt>(Operands[0]);
4341 auto *Op1 = dyn_cast<ConstantInt>(Operands[1]);
4342 if (Op0 && Op1 && Op0->getValue().uge(Op1->getValue()))
4343 return ConstantVector::getNullValue(SVTy);
4344 break;
4345 }
4346 case Intrinsic::vector_interleave2:
4347 case Intrinsic::vector_interleave3:
4348 case Intrinsic::vector_interleave4:
4349 case Intrinsic::vector_interleave5:
4350 case Intrinsic::vector_interleave6:
4351 case Intrinsic::vector_interleave7:
4352 case Intrinsic::vector_interleave8: {
4353 Constant *SplatVal = Operands[0]->getSplatValue();
4354 if (!SplatVal)
4355 return nullptr;
4356
4357 if (!llvm::all_equal(Operands))
4358 return nullptr;
4359
4360 return ConstantVector::getSplat(SVTy->getElementCount(), SplatVal);
4361 }
4362 default:
4363 break;
4364 }
4365
4366 // If trivially vectorizable, try folding it via the scalar call if all
4367 // operands are splats.
4368
4369 // TODO: ConstantFoldFixedVectorCall should probably check this too?
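// For example, umax(splat(3), splat(5)) on a scalable vector folds to
// splat(5) via the scalar fold on the splat values.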
4370 if (!isTriviallyVectorizable(IntrinsicID))
4371 return nullptr;
4372
4373 SmallVector<Constant *, 4> SplatOps;
4374 for (auto [I, Op] : enumerate(Operands)) {
4375 if (isVectorIntrinsicWithScalarOpAtArg(IntrinsicID, I, /*TTI=*/nullptr)) {
4376 SplatOps.push_back(Op);
4377 continue;
4378 }
4379 Constant *Splat = Op->getSplatValue();
4380 if (!Splat)
4381 return nullptr;
4382 SplatOps.push_back(Splat);
4383 }
4384 Constant *Folded = ConstantFoldScalarCall(
4385 Name, IntrinsicID, SVTy->getElementType(), SplatOps, TLI, Call);
4386 if (!Folded)
4387 return nullptr;
4388 return ConstantVector::getSplat(SVTy->getElementCount(), Folded);
4389}
4390
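// Fold a scalar frexp call into its {mantissa, exponent} pair; e.g.
// frexp(8.0) yields {0.5, 4} since 8.0 == 0.5 * 2^4.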
4391static std::pair<Constant *, Constant *>
4392ConstantFoldScalarFrexpCall(Constant *Op, Type *IntTy) {
4393 if (isa<PoisonValue>(Op))
4394 return {Op, PoisonValue::get(IntTy)};
4395
4396 auto *ConstFP = dyn_cast<ConstantFP>(Op);
4397 if (!ConstFP)
4398 return {};
4399
4400 const APFloat &U = ConstFP->getValueAPF();
4401 int FrexpExp;
4402 APFloat FrexpMant = frexp(U, FrexpExp, APFloat::rmNearestTiesToEven);
4403 Constant *Result0 = ConstantFP::get(ConstFP->getType(), FrexpMant);
4404
4405 // The exponent is an "unspecified value" for inf/nan. We use zero to avoid
4406 // using undef.
4407 Constant *Result1 = FrexpMant.isFinite()
4408 ? ConstantInt::getSigned(IntTy, FrexpExp)
4409 : ConstantInt::getNullValue(IntTy);
4410 return {Result0, Result1};
4411}
4412
4413/// Handle intrinsics that return tuples, which may be tuples of vectors.
4414static Constant *
4415ConstantFoldStructCall(StringRef Name, Intrinsic::ID IntrinsicID,
4416 StructType *StTy, ArrayRef<Constant *> Operands,
4417 const DataLayout &DL, const TargetLibraryInfo *TLI,
4418 const CallBase *Call) {
4419
4420 switch (IntrinsicID) {
4421 case Intrinsic::frexp: {
4422 Type *Ty0 = StTy->getContainedType(0);
4423 Type *Ty1 = StTy->getContainedType(1)->getScalarType();
4424
4425 if (auto *FVTy0 = dyn_cast<FixedVectorType>(Ty0)) {
4426 SmallVector<Constant *, 4> Results0(FVTy0->getNumElements());
4427 SmallVector<Constant *, 4> Results1(FVTy0->getNumElements());
4428
4429 for (unsigned I = 0, E = FVTy0->getNumElements(); I != E; ++I) {
4430 Constant *Lane = Operands[0]->getAggregateElement(I);
4431 std::tie(Results0[I], Results1[I]) =
4432 ConstantFoldScalarFrexpCall(Lane, Ty1);
4433 if (!Results0[I])
4434 return nullptr;
4435 }
4436
4437 return ConstantStruct::get(StTy, ConstantVector::get(Results0),
4438 ConstantVector::get(Results1));
4439 }
4440
4441 auto [Result0, Result1] = ConstantFoldScalarFrexpCall(Operands[0], Ty1);
4442 if (!Result0)
4443 return nullptr;
4444 return ConstantStruct::get(StTy, Result0, Result1);
4445 }
4446 case Intrinsic::sincos: {
4447 Type *Ty = StTy->getContainedType(0);
4448 Type *TyScalar = Ty->getScalarType();
4449
4450 auto ConstantFoldScalarSincosCall =
4451 [&](Constant *Op) -> std::pair<Constant *, Constant *> {
4452 Constant *SinResult =
4453 ConstantFoldScalarCall(Name, Intrinsic::sin, TyScalar, Op, TLI, Call);
4454 Constant *CosResult =
4455 ConstantFoldScalarCall(Name, Intrinsic::cos, TyScalar, Op, TLI, Call);
4456 return std::make_pair(SinResult, CosResult);
4457 };
4458
4459 if (auto *FVTy = dyn_cast<FixedVectorType>(Ty)) {
4460 SmallVector<Constant *> SinResults(FVTy->getNumElements());
4461 SmallVector<Constant *> CosResults(FVTy->getNumElements());
4462
4463 for (unsigned I = 0, E = FVTy->getNumElements(); I != E; ++I) {
4464 Constant *Lane = Operands[0]->getAggregateElement(I);
4465 std::tie(SinResults[I], CosResults[I]) =
4466 ConstantFoldScalarSincosCall(Lane);
4467 if (!SinResults[I] || !CosResults[I])
4468 return nullptr;
4469 }
4470
4471 return ConstantStruct::get(StTy, ConstantVector::get(SinResults),
4472 ConstantVector::get(CosResults));
4473 }
4474
4475 auto [SinResult, CosResult] = ConstantFoldScalarSincosCall(Operands[0]);
4476 if (!SinResult || !CosResult)
4477 return nullptr;
4478 return ConstantStruct::get(StTy, SinResult, CosResult);
4479 }
4480 case Intrinsic::vector_deinterleave2:
4481 case Intrinsic::vector_deinterleave3:
4482 case Intrinsic::vector_deinterleave4:
4483 case Intrinsic::vector_deinterleave5:
4484 case Intrinsic::vector_deinterleave6:
4485 case Intrinsic::vector_deinterleave7:
4486 case Intrinsic::vector_deinterleave8: {
4487 unsigned NumResults = StTy->getNumElements();
4488 auto *Vec = Operands[0];
4489 auto *VecTy = cast<VectorType>(Vec->getType());
4490
4491 ElementCount ResultEC =
4492 VecTy->getElementCount().divideCoefficientBy(NumResults);
4493
4494 if (auto *EltC = Vec->getSplatValue()) {
4495 auto *ResultVec = ConstantVector::getSplat(ResultEC, EltC);
4496 SmallVector<Constant *, 8> Results(NumResults, ResultVec);
4497 return ConstantStruct::get(StTy, Results);
4498 }
4499
4500 if (!ResultEC.isFixed())
4501 return nullptr;
4502
4503 unsigned NumElements = ResultEC.getFixedValue();
4504 SmallVector<Constant *> Results(NumResults);
4505 SmallVector<Constant *> Elements(NumElements);
4506 for (unsigned I = 0; I != NumResults; ++I) {
4507 for (unsigned J = 0; J != NumElements; ++J) {
4508 Constant *Elt = Vec->getAggregateElement(J * NumResults + I);
4509 if (!Elt)
4510 return nullptr;
4511 Elements[J] = Elt;
4512 }
4513 Results[I] = ConstantVector::get(Elements);
4514 }
4515 return ConstantStruct::get(StTy, Results);
4516 }
4517 default:
4518 // TODO: Constant folding of vector intrinsics that fall through here does
4519 // not work (e.g. overflow intrinsics)
4520 return ConstantFoldScalarCall(Name, IntrinsicID, StTy, Operands, TLI, Call);
4521 }
4522
4523 return nullptr;
4524}
4525
4526} // end anonymous namespace
4527
4528Constant *llvm::ConstantFoldBinaryIntrinsic(Intrinsic::ID ID, Constant *LHS,
4529 Constant *RHS, Type *Ty,
4530 Instruction *FMFSource) {
4531 auto *Call = dyn_cast_if_present<CallBase>(FMFSource);
4532 // Ensure we check flags like StrictFP that might prevent this from getting
4533 // folded before generating a result.
4534 if (Call && !canConstantFoldCallTo(Call, Call->getCalledFunction()))
4535 return nullptr;
4536 return ConstantFoldIntrinsicCall2(ID, Ty, {LHS, RHS}, Call);
4537}
4538
4539Constant *llvm::ConstantFoldCall(const CallBase *Call, Function *F,
4540 ArrayRef<Constant *> Operands,
4541 const TargetLibraryInfo *TLI,
4542 bool AllowNonDeterministic) {
4543 if (Call->isNoBuiltin())
4544 return nullptr;
4545 if (!F->hasName())
4546 return nullptr;
4547
4548 // If this is not an intrinsic and not recognized as a library call, bail out.
4549 Intrinsic::ID IID = F->getIntrinsicID();
4550 if (IID == Intrinsic::not_intrinsic) {
4551 if (!TLI)
4552 return nullptr;
4553 LibFunc LibF;
4554 if (!TLI->getLibFunc(*F, LibF))
4555 return nullptr;
4556 }
4557
4558 // Conservatively assume that floating-point libcalls may be
4559 // non-deterministic.
4560 Type *Ty = F->getReturnType();
4561 if (!AllowNonDeterministic && Ty->isFPOrFPVectorTy())
4562 return nullptr;
4563
4564 StringRef Name = F->getName();
4565 if (auto *FVTy = dyn_cast<FixedVectorType>(Ty))
4566 return ConstantFoldFixedVectorCall(
4567 Name, IID, FVTy, Operands, F->getDataLayout(), TLI, Call);
4568
4569 if (auto *SVTy = dyn_cast<ScalableVectorType>(Ty))
4570 return ConstantFoldScalableVectorCall(
4571 Name, IID, SVTy, Operands, F->getDataLayout(), TLI, Call);
4572
4573 if (auto *StTy = dyn_cast<StructType>(Ty))
4574 return ConstantFoldStructCall(Name, IID, StTy, Operands,
4575 F->getDataLayout(), TLI, Call);
4576
4577 // TODO: If this is a library function, we already discovered that above,
4578 // so we should pass the LibFunc, not the name (and it might be better
4579 // still to separate intrinsic handling from libcalls).
4580 return ConstantFoldScalarCall(Name, IID, Ty, Operands, TLI, Call);
4581}
4582
4583bool llvm::isMathLibCallNoop(const CallBase *Call,
4584 const TargetLibraryInfo *TLI) {
4585 // FIXME: Refactor this code; this duplicates logic in LibCallsShrinkWrap
4586 // (and to some extent ConstantFoldScalarCall).
4587 if (Call->isNoBuiltin() || Call->isStrictFP())
4588 return false;
4589 Function *F = Call->getCalledFunction();
4590 if (!F)
4591 return false;
4592
4593 LibFunc Func;
4594 if (!TLI || !TLI->getLibFunc(*F, Func))
4595 return false;
4596
4597 if (Call->arg_size() == 1) {
4598 if (ConstantFP *OpC = dyn_cast<ConstantFP>(Call->getArgOperand(0))) {
4599 const APFloat &Op = OpC->getValueAPF();
4600 switch (Func) {
4601 case LibFunc_logl:
4602 case LibFunc_log:
4603 case LibFunc_logf:
4604 case LibFunc_log2l:
4605 case LibFunc_log2:
4606 case LibFunc_log2f:
4607 case LibFunc_log10l:
4608 case LibFunc_log10:
4609 case LibFunc_log10f:
4610 return Op.isNaN() || (!Op.isZero() && !Op.isNegative());
4611
4612 case LibFunc_ilogb:
4613 return !Op.isNaN() && !Op.isZero() && !Op.isInfinity();
4614
4615 case LibFunc_expl:
4616 case LibFunc_exp:
4617 case LibFunc_expf:
4618 // FIXME: These boundaries are slightly conservative.
4619 if (OpC->getType()->isDoubleTy())
4620 return !(Op < APFloat(-745.0) || Op > APFloat(709.0));
4621 if (OpC->getType()->isFloatTy())
4622 return !(Op < APFloat(-103.0f) || Op > APFloat(88.0f));
4623 break;
4624
4625 case LibFunc_exp2l:
4626 case LibFunc_exp2:
4627 case LibFunc_exp2f:
4628 // FIXME: These boundaries are slightly conservative.
4629 if (OpC->getType()->isDoubleTy())
4630 return !(Op < APFloat(-1074.0) || Op > APFloat(1023.0));
4631 if (OpC->getType()->isFloatTy())
4632 return !(Op < APFloat(-149.0f) || Op > APFloat(127.0f));
4633 break;
4634
4635 case LibFunc_sinl:
4636 case LibFunc_sin:
4637 case LibFunc_sinf:
4638 case LibFunc_cosl:
4639 case LibFunc_cos:
4640 case LibFunc_cosf:
4641 return !Op.isInfinity();
4642
4643 case LibFunc_tanl:
4644 case LibFunc_tan:
4645 case LibFunc_tanf: {
4646 // FIXME: Stop using the host math library.
4647 // FIXME: The computation isn't done in the right precision.
4648 Type *Ty = OpC->getType();
4649 if (Ty->isDoubleTy() || Ty->isFloatTy() || Ty->isHalfTy())
4650 return ConstantFoldFP(tan, OpC->getValueAPF(), Ty) != nullptr;
4651 break;
4652 }
4653
4654 case LibFunc_atan:
4655 case LibFunc_atanf:
4656 case LibFunc_atanl:
4657 // Per POSIX, this MAY fail if Op is denormal. We choose not to fail.
4658 return true;
4659
4660 case LibFunc_asinl:
4661 case LibFunc_asin:
4662 case LibFunc_asinf:
4663 case LibFunc_acosl:
4664 case LibFunc_acos:
4665 case LibFunc_acosf:
4666 return !(Op < APFloat::getOne(Op.getSemantics(), true) ||
4667 Op > APFloat::getOne(Op.getSemantics()));
4668
4669 case LibFunc_sinh:
4670 case LibFunc_cosh:
4671 case LibFunc_sinhf:
4672 case LibFunc_coshf:
4673 case LibFunc_sinhl:
4674 case LibFunc_coshl:
4675 // FIXME: These boundaries are slightly conservative.
4676 if (OpC->getType()->isDoubleTy())
4677 return !(Op < APFloat(-710.0) || Op > APFloat(710.0));
4678 if (OpC->getType()->isFloatTy())
4679 return !(Op < APFloat(-89.0f) || Op > APFloat(89.0f));
4680 break;
4681
4682 case LibFunc_sqrtl:
4683 case LibFunc_sqrt:
4684 case LibFunc_sqrtf:
4685 return Op.isNaN() || Op.isZero() || !Op.isNegative();
4686
4687 // FIXME: Add more functions: sqrt_finite, atanh, expm1, log1p,
4688 // maybe others?
4689 default:
4690 break;
4691 }
4692 }
4693 }
4694
4695 if (Call->arg_size() == 2) {
4696 ConstantFP *Op0C = dyn_cast<ConstantFP>(Call->getArgOperand(0));
4697 ConstantFP *Op1C = dyn_cast<ConstantFP>(Call->getArgOperand(1));
4698 if (Op0C && Op1C) {
4699 const APFloat &Op0 = Op0C->getValueAPF();
4700 const APFloat &Op1 = Op1C->getValueAPF();
4701
4702 switch (Func) {
4703 case LibFunc_powl:
4704 case LibFunc_pow:
4705 case LibFunc_powf: {
4706 // FIXME: Stop using the host math library.
4707 // FIXME: The computation isn't done in the right precision.
4708 Type *Ty = Op0C->getType();
4709 if (Ty->isDoubleTy() || Ty->isFloatTy() || Ty->isHalfTy()) {
4710 if (Ty == Op1C->getType())
4711 return ConstantFoldBinaryFP(pow, Op0, Op1, Ty) != nullptr;
4712 }
4713 break;
4714 }
4715
4716 case LibFunc_fmodl:
4717 case LibFunc_fmod:
4718 case LibFunc_fmodf:
4719 case LibFunc_remainderl:
4720 case LibFunc_remainder:
4721 case LibFunc_remainderf:
4722 return Op0.isNaN() || Op1.isNaN() ||
4723 (!Op0.isInfinity() && !Op1.isZero());
4724
4725 case LibFunc_atan2:
4726 case LibFunc_atan2f:
4727 case LibFunc_atan2l:
4728 // Although IEEE-754 says atan2(+/-0.0, +/-0.0) are well-defined, and
4729 // GLIBC and MSVC do not appear to raise an error on those, we
4730 // cannot rely on that behavior. POSIX and C11 say that a domain error
4731 // may occur, so allow for that possibility.
4732 return !Op0.isZero() || !Op1.isZero();
4733
4734 default:
4735 break;
4736 }
4737 }
4738 }
4739
4740 return false;
4741}
4742
4744 unsigned CastOp, const DataLayout &DL,
4745 PreservedCastFlags *Flags) {
4746 switch (CastOp) {
4747 case Instruction::BitCast:
4748 // Bitcast is always lossless.
4749 return ConstantFoldCastOperand(Instruction::BitCast, C, InvCastTo, DL);
4750 case Instruction::Trunc: {
4751 auto *ZExtC = ConstantFoldCastOperand(Instruction::ZExt, C, InvCastTo, DL);
4752 if (Flags) {
4753 // Truncation back on ZExt value is always NUW.
4754 Flags->NUW = true;
4755 // Test positivity of C.
4756 auto *SExtC =
4757 ConstantFoldCastOperand(Instruction::SExt, C, InvCastTo, DL);
4758 Flags->NSW = ZExtC == SExtC;
4759 }
4760 return ZExtC;
4761 }
4762 case Instruction::SExt:
4763 case Instruction::ZExt: {
4764 auto *InvC = ConstantExpr::getTrunc(C, InvCastTo);
4765 auto *CastInvC = ConstantFoldCastOperand(CastOp, InvC, C->getType(), DL);
4766 // Must satisfy CastOp(InvC) == C.
4767 if (!CastInvC || CastInvC != C)
4768 return nullptr;
4769 if (Flags && CastOp == Instruction::ZExt) {
4770 auto *SExtInvC =
4771 ConstantFoldCastOperand(Instruction::SExt, InvC, C->getType(), DL);
4772 // Test positivity of InvC.
4773 Flags->NNeg = CastInvC == SExtInvC;
4774 }
4775 return InvC;
4776 }
4777 default:
4778 return nullptr;
4779 }
4780}
4781
4783 const DataLayout &DL,
4784 PreservedCastFlags *Flags) {
4785 return getLosslessInvCast(C, DestTy, Instruction::ZExt, DL, Flags);
4786}
4787
4789 const DataLayout &DL,
4790 PreservedCastFlags *Flags) {
4791 return getLosslessInvCast(C, DestTy, Instruction::SExt, DL, Flags);
4792}
4793
4794void TargetFolder::anchor() {}
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
constexpr LLT S1
This file declares a class to represent arbitrary precision floating point values and provide a varie...
This file implements a class to represent arbitrary precision integral constant values and operations...
This file implements the APSInt class, which is a simple class that represents an arbitrary sized int...
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
Function Alias Analysis Results
static GCRegistry::Add< ErlangGC > A("erlang", "erlang-compatible garbage collector")
static GCRegistry::Add< CoreCLRGC > E("coreclr", "CoreCLR-compatible GC")
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")
static Constant * FoldBitCast(Constant *V, Type *DestTy)
static ConstantFP * flushDenormalConstant(Type *Ty, const APFloat &APF, DenormalMode::DenormalModeKind Mode)
Constant * getConstantAtOffset(Constant *Base, APInt Offset, const DataLayout &DL)
If this Offset points exactly to the start of an aggregate element, return that element,...
static cl::opt< bool > DisableFPCallFolding("disable-fp-call-folding", cl::desc("Disable constant-folding of FP intrinsics and libcalls."), cl::init(false), cl::Hidden)
static ConstantFP * flushDenormalConstantFP(ConstantFP *CFP, const Instruction *Inst, bool IsOutput)
static DenormalMode getInstrDenormalMode(const Instruction *CtxI, Type *Ty)
Return the denormal mode that can be assumed when executing a floating point operation at CtxI.
This file contains the declarations for the subclasses of Constant, which represent the different fla...
This file defines the DenseMap class.
Hexagon Common GEP
amode Optimize addressing mode
const AbstractManglingParser< Derived, Alloc >::OperatorInfo AbstractManglingParser< Derived, Alloc >::Ops[]
#define F(x, y, z)
Definition MD5.cpp:54
#define I(x, y, z)
Definition MD5.cpp:57
static bool InRange(int64_t Value, unsigned short Shift, int LBound, int HBound)
This file contains the definitions of the enumerations and flags associated with NVVM Intrinsics,...
if(PassOpts->AAPipeline)
const SmallVectorImpl< MachineOperand > & Cond
static cl::opt< RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode > Mode("regalloc-enable-advisor", cl::Hidden, cl::init(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Default), cl::desc("Enable regalloc advisor mode"), cl::values(clEnumValN(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Default, "default", "Default"), clEnumValN(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Release, "release", "precompiled"), clEnumValN(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Development, "development", "for training")))
This file contains some templates that are useful if you are working with the STL at all.
This file defines the SmallVector class.
static TableGen::Emitter::OptClass< SkeletonEmitter > X("gen-skeleton-class", "Generate example skeleton class")
static SymbolRef::Type getType(const Symbol *Sym)
Definition TapiFile.cpp:39
The Input class is used to parse a yaml document into in-memory structs and vectors.
static constexpr roundingMode rmTowardZero
Definition APFloat.h:348
llvm::RoundingMode roundingMode
IEEE-754R 4.3: Rounding-direction attributes.
Definition APFloat.h:342
static const fltSemantics & IEEEdouble()
Definition APFloat.h:297
static constexpr roundingMode rmTowardNegative
Definition APFloat.h:347
static constexpr roundingMode rmNearestTiesToEven
Definition APFloat.h:344
static constexpr roundingMode rmTowardPositive
Definition APFloat.h:346
static const fltSemantics & IEEEhalf()
Definition APFloat.h:294
static constexpr roundingMode rmNearestTiesToAway
Definition APFloat.h:349
opStatus
IEEE-754R 7: Default exception handling.
Definition APFloat.h:360
static APFloat getQNaN(const fltSemantics &Sem, bool Negative=false, const APInt *payload=nullptr)
Factory for QNaN values.
Definition APFloat.h:1102
opStatus divide(const APFloat &RHS, roundingMode RM)
Definition APFloat.h:1190
void copySign(const APFloat &RHS)
Definition APFloat.h:1284
LLVM_ABI opStatus convert(const fltSemantics &ToSemantics, roundingMode RM, bool *losesInfo)
Definition APFloat.cpp:6053
opStatus subtract(const APFloat &RHS, roundingMode RM)
Definition APFloat.h:1172
bool isNegative() const
Definition APFloat.h:1431
LLVM_ABI double convertToDouble() const
Converts this APFloat to host double value.
Definition APFloat.cpp:6112
bool isPosInfinity() const
Definition APFloat.h:1444
bool isNormal() const
Definition APFloat.h:1435
bool isDenormal() const
Definition APFloat.h:1432
opStatus add(const APFloat &RHS, roundingMode RM)
Definition APFloat.h:1163
const fltSemantics & getSemantics() const
Definition APFloat.h:1439
bool isNonZero() const
Definition APFloat.h:1440
bool isFinite() const
Definition APFloat.h:1436
bool isNaN() const
Definition APFloat.h:1429
static APFloat getOne(const fltSemantics &Sem, bool Negative=false)
Factory for Positive and Negative One.
Definition APFloat.h:1070
opStatus multiply(const APFloat &RHS, roundingMode RM)
Definition APFloat.h:1181
LLVM_ABI float convertToFloat() const
Converts this APFloat to host float value.
Definition APFloat.cpp:6143
bool isSignaling() const
Definition APFloat.h:1433
opStatus fusedMultiplyAdd(const APFloat &Multiplicand, const APFloat &Addend, roundingMode RM)
Definition APFloat.h:1217
bool isZero() const
Definition APFloat.h:1427
APInt bitcastToAPInt() const
Definition APFloat.h:1335
opStatus convertToInteger(MutableArrayRef< integerPart > Input, unsigned int Width, bool IsSigned, roundingMode RM, bool *IsExact) const
Definition APFloat.h:1314
opStatus mod(const APFloat &RHS)
Definition APFloat.h:1208
bool isNegInfinity() const
Definition APFloat.h:1445
opStatus roundToIntegral(roundingMode RM)
Definition APFloat.h:1230
void changeSign()
Definition APFloat.h:1279
static APFloat getZero(const fltSemantics &Sem, bool Negative=false)
Factory for Positive and Negative Zero.
Definition APFloat.h:1061
bool isInfinity() const
Definition APFloat.h:1428
Class for arbitrary precision integers.
Definition APInt.h:78
LLVM_ABI APInt umul_ov(const APInt &RHS, bool &Overflow) const
Definition APInt.cpp:1971
LLVM_ABI APInt usub_sat(const APInt &RHS) const
Definition APInt.cpp:2055
bool isMinSignedValue() const
Determine if this is the smallest signed value.
Definition APInt.h:424
uint64_t getZExtValue() const
Get zero extended value.
Definition APInt.h:1541
LLVM_ABI uint64_t extractBitsAsZExtValue(unsigned numBits, unsigned bitPosition) const
Definition APInt.cpp:520
LLVM_ABI APInt zextOrTrunc(unsigned width) const
Zero extend or truncate to width.
Definition APInt.cpp:1033
LLVM_ABI APInt trunc(unsigned width) const
Truncate to new width.
Definition APInt.cpp:936
APInt abs() const
Get the absolute value.
Definition APInt.h:1796
LLVM_ABI APInt sadd_sat(const APInt &RHS) const
Definition APInt.cpp:2026
bool sgt(const APInt &RHS) const
Signed greater than comparison.
Definition APInt.h:1202
LLVM_ABI APInt usub_ov(const APInt &RHS, bool &Overflow) const
Definition APInt.cpp:1948
bool ugt(const APInt &RHS) const
Unsigned greater than comparison.
Definition APInt.h:1183
bool isZero() const
Determine if this value is zero, i.e. all bits are clear.
Definition APInt.h:381
LLVM_ABI APInt urem(const APInt &RHS) const
Unsigned remainder operation.
Definition APInt.cpp:1666
unsigned getBitWidth() const
Return the number of bits in the APInt.
Definition APInt.h:1489
bool ult(const APInt &RHS) const
Unsigned less than comparison.
Definition APInt.h:1112
static APInt getSignedMaxValue(unsigned numBits)
Gets maximum signed value of APInt for a specific bit width.
Definition APInt.h:210
LLVM_ABI APInt sadd_ov(const APInt &RHS, bool &Overflow) const
Definition APInt.cpp:1928
LLVM_ABI APInt uadd_ov(const APInt &RHS, bool &Overflow) const
Definition APInt.cpp:1935
unsigned countr_zero() const
Count the number of trailing zero bits.
Definition APInt.h:1640
unsigned countl_zero() const
The APInt version of std::countl_zero.
Definition APInt.h:1599
static APInt getSignedMinValue(unsigned numBits)
Gets minimum signed value of APInt for a specific bit width.
Definition APInt.h:220
LLVM_ABI APInt sextOrTrunc(unsigned width) const
Sign extend or truncate to width.
Definition APInt.cpp:1041
LLVM_ABI APInt uadd_sat(const APInt &RHS) const
Definition APInt.cpp:2036
APInt ashr(unsigned ShiftAmt) const
Arithmetic right-shift function.
Definition APInt.h:828
LLVM_ABI APInt smul_ov(const APInt &RHS, bool &Overflow) const
Definition APInt.cpp:1960
LLVM_ABI APInt sext(unsigned width) const
Sign extend to a new width.
Definition APInt.cpp:985
APInt shl(unsigned shiftAmt) const
Left-shift function.
Definition APInt.h:874
bool slt(const APInt &RHS) const
Signed less than comparison.
Definition APInt.h:1131
LLVM_ABI APInt extractBits(unsigned numBits, unsigned bitPosition) const
Return an APInt with the extracted bits [bitPosition,bitPosition+numBits).
Definition APInt.cpp:482
LLVM_ABI APInt ssub_ov(const APInt &RHS, bool &Overflow) const
Definition APInt.cpp:1941
bool isOne() const
Determine if this is a value of 1.
Definition APInt.h:390
APInt lshr(unsigned shiftAmt) const
Logical right-shift function.
Definition APInt.h:852
LLVM_ABI APInt ssub_sat(const APInt &RHS) const
Definition APInt.cpp:2045
An arbitrary precision integer that knows its signedness.
Definition APSInt.h:24
This class represents an incoming formal argument to a Function.
Definition Argument.h:32
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition ArrayRef.h:40
size_t size() const
size - Get the array size.
Definition ArrayRef.h:142
Base class for all callable instructions (InvokeInst and CallInst) Holds everything related to callin...
static LLVM_ABI Instruction::CastOps getCastOpcode(const Value *Val, bool SrcIsSigned, Type *Ty, bool DstIsSigned)
Returns the opcode necessary to cast Val into Ty using usual casting rules.
static LLVM_ABI unsigned isEliminableCastPair(Instruction::CastOps firstOpcode, Instruction::CastOps secondOpcode, Type *SrcTy, Type *MidTy, Type *DstTy, const DataLayout *DL)
Determine how a pair of casts can be eliminated, if they can be at all.
static LLVM_ABI bool castIsValid(Instruction::CastOps op, Type *SrcTy, Type *DstTy)
This method can be used to determine if a cast from SrcTy to DstTy using Opcode op is valid or not.
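These CastInst helpers guard the cast folds: getCastOpcode picks the opcode the usual casting rules imply, and castIsValid rejects impossible casts before a constant expression is built. A small sketch, assuming only an existing LLVMContext:

static void castOpcodeSketch(LLVMContext &Ctx) {
  Type *I32 = Type::getInt32Ty(Ctx);
  Type *I64 = Type::getInt64Ty(Ctx);
  Constant *C = ConstantInt::get(I32, 42);
  // A signed i32 -> i64 cast resolves to sext under the usual casting rules.
  Instruction::CastOps Opc =
      CastInst::getCastOpcode(C, /*SrcIsSigned=*/true, I64, /*DstIsSigned=*/true);
  assert(CastInst::castIsValid(Opc, C, I64) && "sext i32 -> i64 must be valid");
  (void)Opc;
}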
Predicate
This enumeration lists the possible predicates for CmpInst subclasses.
Definition InstrTypes.h:676
bool isSigned() const
Definition InstrTypes.h:930
Predicate getSwappedPredicate() const
For example, EQ->EQ, SLE->SGE, ULT->UGT, OEQ->OEQ, ULE->UGE, OLT->OGT, etc.
Definition InstrTypes.h:827
static bool isFPPredicate(Predicate P)
Definition InstrTypes.h:770
static Constant * get(LLVMContext &Context, ArrayRef< ElementTy > Elts)
get() constructor - Return a constant with array type with an element count and element type matching...
Definition Constants.h:723
static LLVM_ABI Constant * getIntToPtr(Constant *C, Type *Ty, bool OnlyIfReduced=false)
static LLVM_ABI Constant * getExtractElement(Constant *Vec, Constant *Idx, Type *OnlyIfReducedTy=nullptr)
static LLVM_ABI bool isDesirableCastOp(unsigned Opcode)
Whether creating a constant expression for this cast is desirable.
static LLVM_ABI Constant * getCast(unsigned ops, Constant *C, Type *Ty, bool OnlyIfReduced=false)
Convenience function for getting a Cast operation.
static LLVM_ABI Constant * getSub(Constant *C1, Constant *C2, bool HasNUW=false, bool HasNSW=false)
static LLVM_ABI Constant * getInsertElement(Constant *Vec, Constant *Elt, Constant *Idx, Type *OnlyIfReducedTy=nullptr)
static LLVM_ABI Constant * getShuffleVector(Constant *V1, Constant *V2, ArrayRef< int > Mask, Type *OnlyIfReducedTy=nullptr)
static bool isSupportedGetElementPtr(const Type *SrcElemTy)
Whether creating a constant expression for this getelementptr type is supported.
Definition Constants.h:1400
static LLVM_ABI Constant * get(unsigned Opcode, Constant *C1, Constant *C2, unsigned Flags=0, Type *OnlyIfReducedTy=nullptr)
get - Return a binary or shift operator constant expression, folding if possible.
static LLVM_ABI bool isDesirableBinOp(unsigned Opcode)
Whether creating a constant expression for this binary operator is desirable.
static Constant * getGetElementPtr(Type *Ty, Constant *C, ArrayRef< Constant * > IdxList, GEPNoWrapFlags NW=GEPNoWrapFlags::none(), std::optional< ConstantRange > InRange=std::nullopt, Type *OnlyIfReducedTy=nullptr)
Getelementptr form.
Definition Constants.h:1287
static LLVM_ABI Constant * getBitCast(Constant *C, Type *Ty, bool OnlyIfReduced=false)
static LLVM_ABI Constant * getTrunc(Constant *C, Type *Ty, bool OnlyIfReduced=false)
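The ConstantExpr factory methods above are how operations that cannot be folded outright are re-expressed as constant expressions. A hypothetical sketch that builds an inbounds GEP constant, assuming an existing Module M that contains an i32 global named "G":

static Constant *inboundsGEPSketch(Module &M) {
  GlobalVariable *G = M.getGlobalVariable("G"); // assumed to exist
  LLVMContext &Ctx = M.getContext();
  Constant *Idx = ConstantInt::get(Type::getInt64Ty(Ctx), 3);
  // Equivalent of: getelementptr inbounds i32, ptr @G, i64 3
  return ConstantExpr::getGetElementPtr(Type::getInt32Ty(Ctx), G, Idx,
                                        GEPNoWrapFlags::inBounds());
}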
ConstantFP - Floating Point Values [float, double].
Definition Constants.h:285
const APFloat & getValueAPF() const
Definition Constants.h:328
static LLVM_ABI Constant * getInfinity(Type *Ty, bool Negative=false)
static LLVM_ABI Constant * getZero(Type *Ty, bool Negative=false)
static LLVM_ABI Constant * getNaN(Type *Ty, bool Negative=false, uint64_t Payload=0)
This is the shared class of boolean and integer constants.
Definition Constants.h:87
static LLVM_ABI ConstantInt * getTrue(LLVMContext &Context)
static LLVM_ABI ConstantInt * getFalse(LLVMContext &Context)
int64_t getSExtValue() const
Return the constant as a 64-bit integer value after it has been sign extended as appropriate for the ...
Definition Constants.h:177
static ConstantInt * getSigned(IntegerType *Ty, int64_t V, bool ImplicitTrunc=true)
Return a ConstantInt with the specified value for the specified type.
Definition Constants.h:138
static LLVM_ABI ConstantInt * getBool(LLVMContext &Context, bool V)
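These ConstantFP and ConstantInt factories produce the folded results themselves. A brief sketch of the common constructions, assuming an existing LLVMContext:

static void constantFactorySketch(LLVMContext &Ctx) {
  Type *F64 = Type::getDoubleTy(Ctx);
  Constant *QNaN = ConstantFP::getNaN(F64);                      // default quiet NaN
  Constant *NegZero = ConstantFP::getZero(F64, /*Negative=*/true);
  ConstantInt *True = ConstantInt::getTrue(Ctx);
  ConstantInt *MinusOne = ConstantInt::getSigned(Type::getInt16Ty(Ctx), -1);
  (void)QNaN; (void)NegZero; (void)True; (void)MinusOne;
}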
static LLVM_ABI Constant * get(StructType *T, ArrayRef< Constant * > V)
static LLVM_ABI Constant * getSplat(ElementCount EC, Constant *Elt)
Return a ConstantVector with the specified constant in each element.
static LLVM_ABI Constant * get(ArrayRef< Constant * > V)
This is an important base class in LLVM.
Definition Constant.h:43
LLVM_ABI Constant * getSplatValue(bool AllowPoison=false) const
If all elements of the vector constant have the same value, return that value.
static LLVM_ABI Constant * getAllOnesValue(Type *Ty)
static LLVM_ABI Constant * getNullValue(Type *Ty)
Constructor to create a '0' constant of arbitrary type.
LLVM_ABI Constant * getAggregateElement(unsigned Elt) const
For aggregates (struct/array/vector) return the constant that corresponds to the specified element if...
LLVM_ABI bool isZeroValue() const
Return true if the value is negative zero or a null value.
Definition Constants.cpp:76
LLVM_ABI bool isNullValue() const
Return true if this is the value that would be returned by getNullValue.
Definition Constants.cpp:90
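The Constant base-class queries above let the folder treat whole aggregates at once instead of element by element. An illustrative sketch, assuming Vec is an existing vector Constant * (say a <4 x i32> splat):

static void aggregateQuerySketch(Constant *Vec) {
  Constant *Splat = Vec->getSplatValue();          // non-null when all lanes agree
  Constant *Lane0 = Vec->getAggregateElement(0u);  // element 0, or nullptr if unknown
  Constant *Zeros = Constant::getNullValue(Vec->getType());
  Constant *Ones = Constant::getAllOnesValue(Vec->getType());
  (void)Splat; (void)Lane0; (void)Zeros; (void)Ones;
}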
Constrained floating point compare intrinsics.
This is the common base class for constrained floating point intrinsics.
LLVM_ABI std::optional< fp::ExceptionBehavior > getExceptionBehavior() const
LLVM_ABI std::optional< RoundingMode > getRoundingMode() const
Wrapper for a function that represents a value that functionally represents the original function.
Definition Constants.h:960
A parsed version of the target data layout string in and methods for querying it.
Definition DataLayout.h:64
iterator find(const_arg_type_t< KeyT > Val)
Definition DenseMap.h:178
iterator end()
Definition DenseMap.h:81
std::pair< iterator, bool > insert(const std::pair< KeyT, ValueT > &KV)
Definition DenseMap.h:241
static LLVM_ABI bool compare(const APFloat &LHS, const APFloat &RHS, FCmpInst::Predicate Pred)
Return result of LHS Pred RHS comparison.
This provides a helper for copying FMF from an instruction or setting specified flags.
Definition IRBuilder.h:93
Class to represent fixed width SIMD vectors.
unsigned getNumElements() const
static LLVM_ABI FixedVectorType * get(Type *ElementType, unsigned NumElts)
Definition Type.cpp:802
DenormalMode getDenormalMode(const fltSemantics &FPType) const
Returns the denormal handling type for the default rounding mode of the function.
Definition Function.cpp:806
Represents flags for the getelementptr instruction/expression.
static GEPNoWrapFlags inBounds()
GEPNoWrapFlags withoutNoUnsignedSignedWrap() const
static GEPNoWrapFlags noUnsignedWrap()
bool hasNoUnsignedSignedWrap() const
bool isInBounds() const
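GEPNoWrapFlags carries the inbounds/nusw/nuw bits through GEP folding. A small sketch of how the flags are queried and relaxed; note that, per the LangRef, inbounds implies nusw:

static void gepFlagsSketch() {
  GEPNoWrapFlags NW = GEPNoWrapFlags::inBounds();
  bool InBounds = NW.isInBounds();                    // true
  GEPNoWrapFlags Relaxed = NW.withoutNoUnsignedSignedWrap();
  bool StillNUSW = Relaxed.hasNoUnsignedSignedWrap(); // false once dropped
  (void)InBounds; (void)StillNUSW;
}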
static LLVM_ABI Type * getIndexedType(Type *Ty, ArrayRef< Value * > IdxList)
Returns the result type of a getelementptr with the given source element type and indexes.
PointerType * getType() const
Global values are always pointers.
LLVM_ABI const DataLayout & getDataLayout() const
Get the data layout of the module this global belongs to.
Definition Globals.cpp:132
const Constant * getInitializer() const
getInitializer - Return the initializer for this global variable.
bool isConstant() const
If the value is a global constant, its value is immutable throughout the runtime execution of the pro...
bool hasDefinitiveInitializer() const
hasDefinitiveInitializer - Whether the global variable has an initializer, and any other instances of...
static LLVM_ABI bool compare(const APInt &LHS, const APInt &RHS, ICmpInst::Predicate Pred)
Return result of LHS Pred RHS comparison.
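ICmpInst::compare evaluates an integer predicate directly on APInt operands, which is the core of icmp folding on constants. A minimal sketch showing the signed/unsigned distinction:

static void icmpFoldSketch() {
  APInt X(32, -5, /*isSigned=*/true);
  APInt Y(32, 5);
  bool SLT = ICmpInst::compare(X, Y, ICmpInst::ICMP_SLT); // true: -5 < 5 as signed
  bool ULT = ICmpInst::compare(X, Y, ICmpInst::ICMP_ULT); // false: 0xFFFFFFFB > 5 as unsigned
  (void)SLT; (void)ULT;
}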
Predicate getSignedPredicate() const
For example, EQ->EQ, SLE->SLE, UGT->SGT, etc.
bool isEquality() const
Return true if this predicate is either EQ or NE.
bool isCast() const
bool isBinaryOp() const
LLVM_ABI const Function * getFunction() const
Return the function this instruction belongs to.
bool isUnaryOp() const
static LLVM_ABI IntegerType * get(LLVMContext &C, unsigned NumBits)
This static method is the primary way of constructing an IntegerType.
Definition Type.cpp:318
This is an important class for using LLVM in a threaded context.
Definition LLVMContext.h:68
static APInt getSaturationPoint(Intrinsic::ID ID, unsigned numBits)
Min/max intrinsics are monotonic; they operate on fixed-bitwidth values, so there is a certain thre...
static ICmpInst::Predicate getPredicate(Intrinsic::ID ID)
Returns the comparison predicate underlying the intrinsic.
static LLVM_ABI PoisonValue * get(Type *T)
Static factory methods - Return a 'poison' object of the specified type.
Class to represent scalable SIMD vectors.
void push_back(const T &Elt)
pointer data()
Return a pointer to the vector's buffer, even if empty().
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
StringRef - Represent a constant reference to a string, i.e.
Definition StringRef.h:55
Used to lazily calculate structure layout information for a target machine, based on the DataLayout s...
Definition DataLayout.h:723
LLVM_ABI unsigned getElementContainingOffset(uint64_t FixedOffset) const
Given a valid byte offset into the structure, returns the structure index that contains it.
TypeSize getElementOffset(unsigned Idx) const
Definition DataLayout.h:754
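StructLayout is what maps a constant byte offset into the struct field that contains it when folding loads from global initializers. A sketch, assuming an existing, sized, non-empty StructType *STy and the module's DataLayout:

static unsigned fieldAtOffsetSketch(const DataLayout &DL, StructType *STy) {
  const StructLayout *SL = DL.getStructLayout(STy);
  unsigned FieldIdx = SL->getElementContainingOffset(/*FixedOffset=*/0); // first field
  uint64_t FieldStart = SL->getElementOffset(FieldIdx).getFixedValue();  // 0 here
  (void)FieldStart;
  return FieldIdx;
}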
Class to represent struct types.
unsigned getNumElements() const
Random access to the elements.
Provides information about what library functions are available for the current target.
bool has(LibFunc F) const
Tests whether a library function is available.
bool getLibFunc(StringRef funcName, LibFunc &F) const
Searches for a particular function name.
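TargetLibraryInfo is consulted before any libcall is folded: the callee name must map to a known LibFunc and that function must be available on the target. A sketch, with TLI assumed to be a const TargetLibraryInfo & supplied by the caller:

static bool fabsIsAvailableSketch(const TargetLibraryInfo &TLI) {
  LibFunc TheLibFunc;
  return TLI.getLibFunc("fabs", TheLibFunc) && TLI.has(TheLibFunc);
}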
The instances of the Type class are immutable: once they are created, they are never changed.
Definition Type.h:45
static LLVM_ABI IntegerType * getInt64Ty(LLVMContext &C)
Definition Type.cpp:297
bool isVectorTy() const
True if this is an instance of VectorType.
Definition Type.h:273
static LLVM_ABI IntegerType * getInt32Ty(LLVMContext &C)
Definition Type.cpp:296
bool isPointerTy() const
True if this is an instance of PointerType.
Definition Type.h:267
LLVM_ABI unsigned getPointerAddressSpace() const
Get the address space of this pointer or pointer vector type.
@ HalfTyID
16-bit floating point type
Definition Type.h:56
@ FloatTyID
32-bit floating point type
Definition Type.h:58
@ DoubleTyID
64-bit floating point type
Definition Type.h:59
static LLVM_ABI IntegerType * getInt8Ty(LLVMContext &C)
Definition Type.cpp:294
Type * getScalarType() const
If this is a vector type, return the element type, otherwise return 'this'.
Definition Type.h:352
LLVM_ABI TypeSize getPrimitiveSizeInBits() const LLVM_READONLY
Return the basic size of this type if it is a primitive type.
Definition Type.cpp:197
static LLVM_ABI IntegerType * getInt16Ty(LLVMContext &C)
Definition Type.cpp:295
bool isSized(SmallPtrSetImpl< Type * > *Visited=nullptr) const
Return true if it makes sense to take the size of this type.
Definition Type.h:311
LLVMContext & getContext() const
Return the LLVMContext in which this type was uniqued.
Definition Type.h:128
LLVM_ABI unsigned getScalarSizeInBits() const LLVM_READONLY
If this is a vector type, return the getPrimitiveSizeInBits value for the element type.
Definition Type.cpp:230
static LLVM_ABI IntegerType * getInt1Ty(LLVMContext &C)
Definition Type.cpp:293
bool isFloatingPointTy() const
Return true if this is one of the floating-point types.
Definition Type.h:184
bool isPtrOrPtrVectorTy() const
Return true if this is a pointer type or a vector of pointer types.
Definition Type.h:270
bool isX86_AMXTy() const
Return true if this is X86 AMX.
Definition Type.h:200
bool isIntegerTy() const
True if this is an instance of IntegerType.
Definition Type.h:240
static LLVM_ABI IntegerType * getIntNTy(LLVMContext &C, unsigned N)
Definition Type.cpp:300
Type * getContainedType(unsigned i) const
This method is used to implement the type iterator (defined at the end of the file).
Definition Type.h:381
LLVM_ABI const fltSemantics & getFltSemantics() const
Definition Type.cpp:106
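The Type queries above drive the dispatch between scalar, vector, pointer, and floating-point folds. A short sketch, assuming an existing LLVMContext:

static void typeQuerySketch(LLVMContext &Ctx) {
  Type *VecTy = FixedVectorType::get(Type::getFloatTy(Ctx), 4);      // <4 x float>
  bool IsVec = VecTy->isVectorTy();                                  // true
  Type *Elt = VecTy->getScalarType();                                // float
  uint64_t EltBits = Elt->getPrimitiveSizeInBits().getFixedValue();  // 32
  bool IsFP = Elt->isFloatingPointTy();                              // true
  (void)IsVec; (void)EltBits; (void)IsFP;
}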
static LLVM_ABI UndefValue * get(Type *T)
Static factory methods - Return an 'undef' object of the specified type.
A Use represents the edge between a Value definition and its users.
Definition Use.h:35
LLVM Value Representation.
Definition Value.h:75
Type * getType() const
All values are typed, get the type of this value.
Definition Value.h:256
LLVM_ABI const Value * stripAndAccumulateConstantOffsets(const DataLayout &DL, APInt &Offset, bool AllowNonInbounds, bool AllowInvariantGroup=false, function_ref< bool(Value &Value, APInt &Offset)> ExternalAnalysis=nullptr, bool LookThroughIntToPtr=false) const
Accumulate the constant offset this value has compared to a base pointer.
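stripAndAccumulateConstantOffsets is how a pointer operand is reduced to an underlying base plus a constant byte offset before a load or GEP is folded. A sketch, assuming Ptr is an existing pointer-typed Value * and DL is the DataLayout:

static const Value *baseAndOffsetSketch(const Value *Ptr, const DataLayout &DL,
                                        APInt &Offset) {
  Offset = APInt(DL.getIndexTypeSizeInBits(Ptr->getType()), 0);
  // The result is the underlying pointer; Offset accumulates the constant byte offset.
  return Ptr->stripAndAccumulateConstantOffsets(DL, Offset,
                                                /*AllowNonInbounds=*/true);
}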
LLVM_ABI LLVMContext & getContext() const
All values hold a context through their type.
Definition Value.cpp:1106
LLVM_ABI uint64_t getPointerDereferenceableBytes(const DataLayout &DL, bool &CanBeNull, bool &CanBeFreed) const
Returns the number of bytes known to be dereferenceable for the pointer value.
Definition Value.cpp:888
Base class of all SIMD vector types.
ElementCount getElementCount() const
Return an ElementCount instance to represent the (possibly scalable) number of elements in the vector...
Type * getElementType() const
constexpr ScalarTy getFixedValue() const
Definition TypeSize.h:200
constexpr bool isScalable() const
Returns whether the quantity is scaled by a runtime quantity (vscale).
Definition TypeSize.h:168
constexpr bool isFixed() const
Returns true if the quantity is not scaled by vscale.
Definition TypeSize.h:171
constexpr LeafTy divideCoefficientBy(ScalarTy RHS) const
We do not provide the '/' operator here because division for polynomial types does not work in the sa...
Definition TypeSize.h:252
static constexpr bool isKnownGE(const FixedOrScalableQuantity &LHS, const FixedOrScalableQuantity &RHS)
Definition TypeSize.h:237
const ParentTy * getParent() const
Definition ilist_node.h:34
CallInst * Call
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
const APInt & smin(const APInt &A, const APInt &B)
Determine the smaller of two APInts considered to be signed.
Definition APInt.h:2249
const APInt & smax(const APInt &A, const APInt &B)
Determine the larger of two APInts considered to be signed.
Definition APInt.h:2254
const APInt & umin(const APInt &A, const APInt &B)
Determine the smaller of two APInts considered to be unsigned.
Definition APInt.h:2259
const APInt & umax(const APInt &A, const APInt &B)
Determine the larger of two APInts considered to be unsigned.
Definition APInt.h:2264
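The APIntOps::smin/smax/umin/umax helpers implement the integer min/max intrinsics on constant operands. A tiny sketch of the signed/unsigned difference:

static void minMaxSketch() {
  APInt A(8, 0x80);                          // -128 when read as signed i8
  APInt B(8, 0x7F);                          // 127
  const APInt &SMin = APIntOps::smin(A, B);  // A: -128 is the signed minimum
  const APInt &UMax = APIntOps::umax(A, B);  // A: 0x80 is the unsigned maximum
  (void)SMin; (void)UMax;
}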
constexpr std::underlying_type_t< E > Mask()
Get a bitmask with 1s in all places up to the high-order bit of E's largest value.
unsigned ID
LLVM IR allows the use of arbitrary numbers as calling convention identifiers.
Definition CallingConv.h:24
@ C
The default llvm calling convention, compatible with C.
Definition CallingConv.h:34
@ CE
Windows NT (Windows on ARM)
Definition MCAsmInfo.h:48
initializer< Ty > init(const Ty &Val)
@ ebStrict
This corresponds to "fpexcept.strict".
Definition FPEnv.h:42
@ ebIgnore
This corresponds to "fpexcept.ignore".
Definition FPEnv.h:40
constexpr double pi
APFloat::roundingMode GetFMARoundingMode(Intrinsic::ID IntrinsicID)
DenormalMode GetNVVMDenormMode(bool ShouldFTZ)
bool FPToIntegerIntrinsicNaNZero(Intrinsic::ID IntrinsicID)
APFloat::roundingMode GetFDivRoundingMode(Intrinsic::ID IntrinsicID)
bool FPToIntegerIntrinsicResultIsSigned(Intrinsic::ID IntrinsicID)
APFloat::roundingMode GetFPToIntegerRoundingMode(Intrinsic::ID IntrinsicID)
bool RCPShouldFTZ(Intrinsic::ID IntrinsicID)
bool FPToIntegerIntrinsicShouldFTZ(Intrinsic::ID IntrinsicID)
bool FDivShouldFTZ(Intrinsic::ID IntrinsicID)
bool FAddShouldFTZ(Intrinsic::ID IntrinsicID)
bool FMinFMaxIsXorSignAbs(Intrinsic::ID IntrinsicID)
APFloat::roundingMode GetFMulRoundingMode(Intrinsic::ID IntrinsicID)
bool UnaryMathIntrinsicShouldFTZ(Intrinsic::ID IntrinsicID)
bool FMinFMaxShouldFTZ(Intrinsic::ID IntrinsicID)
APFloat::roundingMode GetFAddRoundingMode(Intrinsic::ID IntrinsicID)
bool FMAShouldFTZ(Intrinsic::ID IntrinsicID)
bool FMulShouldFTZ(Intrinsic::ID IntrinsicID)
APFloat::roundingMode GetRCPRoundingMode(Intrinsic::ID IntrinsicID)
bool FMinFMaxPropagatesNaNs(Intrinsic::ID IntrinsicID)
NodeAddr< FuncNode * > Func
Definition RDFGraph.h:393
LLVM_ABI std::error_code status(const Twine &path, file_status &result, bool follow=true)
Get file status as if by POSIX stat().
This is an optimization pass for GlobalISel generic memory operations.
auto drop_begin(T &&RangeOrContainer, size_t N=1)
Return a range covering RangeOrContainer with the first N elements excluded.
Definition STLExtras.h:316
@ Offset
Definition DWP.cpp:532
LLVM_ABI Constant * ConstantFoldBinaryIntrinsic(Intrinsic::ID ID, Constant *LHS, Constant *RHS, Type *Ty, Instruction *FMFSource)
bool all_of(R &&range, UnaryPredicate P)
Provide wrappers to std::all_of which take ranges instead of having to pass begin/end explicitly.
Definition STLExtras.h:1737
LLVM_ABI Constant * ConstantFoldLoadThroughBitcast(Constant *C, Type *DestTy, const DataLayout &DL)
ConstantFoldLoadThroughBitcast - try to cast constant to destination type returning null if unsuccess...
static double log2(double V)
LLVM_ABI Constant * ConstantFoldSelectInstruction(Constant *Cond, Constant *V1, Constant *V2)
Attempt to constant fold a select instruction with the specified operands.
LLVM_ABI Constant * ConstantFoldFPInstOperands(unsigned Opcode, Constant *LHS, Constant *RHS, const DataLayout &DL, const Instruction *I, bool AllowNonDeterministic=true)
Attempt to constant fold a floating point binary operation with the specified operands,...
auto enumerate(FirstRange &&First, RestRanges &&...Rest)
Given two or more input ranges, returns a new range whose values are tuples (A, B,...
Definition STLExtras.h:2530
LLVM_ABI bool canConstantFoldCallTo(const CallBase *Call, const Function *F)
canConstantFoldCallTo - Return true if it's even possible to fold a call to the specified function.
unsigned getPointerAddressSpace(const Type *T)
Definition SPIRVUtils.h:367
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:643
LLVM_ABI Constant * ConstantFoldInstruction(const Instruction *I, const DataLayout &DL, const TargetLibraryInfo *TLI=nullptr)
ConstantFoldInstruction - Try to constant fold the specified instruction.
APFloat abs(APFloat X)
Returns the absolute value of the argument.
Definition APFloat.h:1545
LLVM_ABI Constant * ConstantFoldCompareInstruction(CmpInst::Predicate Predicate, Constant *C1, Constant *C2)
LLVM_ABI Constant * ConstantFoldUnaryInstruction(unsigned Opcode, Constant *V)
LLVM_ABI bool IsConstantOffsetFromGlobal(Constant *C, GlobalValue *&GV, APInt &Offset, const DataLayout &DL, DSOLocalEquivalent **DSOEquiv=nullptr)
If this constant is a constant offset from a global, return the global and the constant.
LLVM_ABI bool isMathLibCallNoop(const CallBase *Call, const TargetLibraryInfo *TLI)
Check whether the given call has no side-effects.
LLVM_ABI Constant * ReadByteArrayFromGlobal(const GlobalVariable *GV, uint64_t Offset)
auto dyn_cast_if_present(const Y &Val)
dyn_cast_if_present<X> - Functionally identical to dyn_cast, except that a null (or none in the case ...
Definition Casting.h:732
LLVM_READONLY APFloat maximum(const APFloat &A, const APFloat &B)
Implements IEEE 754-2019 maximum semantics.
Definition APFloat.h:1625
LLVM_ABI Constant * ConstantFoldCompareInstOperands(unsigned Predicate, Constant *LHS, Constant *RHS, const DataLayout &DL, const TargetLibraryInfo *TLI=nullptr, const Instruction *I=nullptr)
Attempt to constant fold a compare instruction (icmp/fcmp) with the specified operands.
int ilogb(const APFloat &Arg)
Returns the exponent of the internal representation of the APFloat.
Definition APFloat.h:1516
bool isa_and_nonnull(const Y &Val)
Definition Casting.h:676
LLVM_ABI Constant * ConstantFoldCall(const CallBase *Call, Function *F, ArrayRef< Constant * > Operands, const TargetLibraryInfo *TLI=nullptr, bool AllowNonDeterministic=true)
ConstantFoldCall - Attempt to constant fold a call to the specified function with the specified argum...
APFloat frexp(const APFloat &X, int &Exp, APFloat::roundingMode RM)
Equivalent of C standard library function.
Definition APFloat.h:1537
LLVM_ABI Constant * ConstantFoldExtractValueInstruction(Constant *Agg, ArrayRef< unsigned > Idxs)
Attempt to constant fold an extractvalue instruction with the specified operands and indices.
LLVM_ABI Constant * ConstantFoldConstant(const Constant *C, const DataLayout &DL, const TargetLibraryInfo *TLI=nullptr)
ConstantFoldConstant - Fold the constant using the specified DataLayout.
auto dyn_cast_or_null(const Y &Val)
Definition Casting.h:753
bool any_of(R &&range, UnaryPredicate P)
Provide wrappers to std::any_of which take ranges instead of having to pass begin/end explicitly.
Definition STLExtras.h:1744
LLVM_READONLY APFloat maxnum(const APFloat &A, const APFloat &B)
Implements IEEE-754 2008 maxNum semantics.
Definition APFloat.h:1580
LLVM_ABI Constant * ConstantFoldLoadFromUniformValue(Constant *C, Type *Ty, const DataLayout &DL)
If C is a uniform value where all bits are the same (either all zero, all ones, all undef or all pois...
LLVM_ABI Constant * ConstantFoldUnaryOpOperand(unsigned Opcode, Constant *Op, const DataLayout &DL)
Attempt to constant fold a unary operation with the specified operand.
LLVM_ABI Constant * FlushFPConstant(Constant *Operand, const Instruction *I, bool IsOutput)
Attempt to flush a floating-point constant according to the denormal mode set in the instruction's parent func...
LLVM_ABI Constant * getLosslessUnsignedTrunc(Constant *C, Type *DestTy, const DataLayout &DL, PreservedCastFlags *Flags=nullptr)
decltype(auto) get(const PointerIntPair< PointerTy, IntBits, IntType, PtrTraits, Info > &Pair)
LLVM_READONLY APFloat minimumnum(const APFloat &A, const APFloat &B)
Implements IEEE 754-2019 minimumNumber semantics.
Definition APFloat.h:1611
FPClassTest
Floating-point class tests, supported by 'is_fpclass' intrinsic.
APFloat scalbn(APFloat X, int Exp, APFloat::roundingMode RM)
Returns: X * 2^Exp for integral exponents.
Definition APFloat.h:1525
LLVM_ABI void computeKnownBits(const Value *V, KnownBits &Known, const DataLayout &DL, AssumptionCache *AC=nullptr, const Instruction *CxtI=nullptr, const DominatorTree *DT=nullptr, bool UseInstrInfo=true, unsigned Depth=0)
Determine which bits of V are known to be either zero or one and return them in the KnownZero/KnownOn...
LLVM_ABI bool NullPointerIsDefined(const Function *F, unsigned AS=0)
Check whether null pointer dereferencing is considered undefined behavior for a given function or an ...
LLVM_ABI Constant * getLosslessSignedTrunc(Constant *C, Type *DestTy, const DataLayout &DL, PreservedCastFlags *Flags=nullptr)
LLVM_ABI Constant * ConstantFoldCastOperand(unsigned Opcode, Constant *C, Type *DestTy, const DataLayout &DL)
Attempt to constant fold a cast with the specified operand.
LLVM_ABI Constant * ConstantFoldLoadFromConst(Constant *C, Type *Ty, const APInt &Offset, const DataLayout &DL)
Extract value of C at the given Offset reinterpreted as Ty.
bool isa(const From &Val)
isa<X> - Return true if the parameter to the template is an instance of one of the template type argu...
Definition Casting.h:547
LLVM_ABI bool intrinsicPropagatesPoison(Intrinsic::ID IID)
Return whether this intrinsic propagates poison for all operands.
LLVM_ABI Constant * ConstantFoldBinaryOpOperands(unsigned Opcode, Constant *LHS, Constant *RHS, const DataLayout &DL)
Attempt to constant fold a binary operation with the specified operands.
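ConstantFoldBinaryOpOperands is one of the DataLayout-aware entry points this file provides. A hypothetical caller-side sketch, assuming an existing Module M:

static Constant *foldAddSketch(Module &M) {
  const DataLayout &DL = M.getDataLayout();
  Type *I32 = Type::getInt32Ty(M.getContext());
  Constant *LHS = ConstantInt::get(I32, 2);
  Constant *RHS = ConstantInt::get(I32, 3);
  // Returns the i32 constant 5; a null result would mean the fold was refused.
  return ConstantFoldBinaryOpOperands(Instruction::Add, LHS, RHS, DL);
}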
MutableArrayRef(T &OneElt) -> MutableArrayRef< T >
LLVM_READONLY APFloat minnum(const APFloat &A, const APFloat &B)
Implements IEEE-754 2008 minNum semantics.
Definition APFloat.h:1561
@ Sub
Subtraction of integers.
LLVM_ABI bool isVectorIntrinsicWithScalarOpAtArg(Intrinsic::ID ID, unsigned ScalarOpdIdx, const TargetTransformInfo *TTI)
Identifies if the vector form of the intrinsic has a scalar operand.
DWARFExpression::Operation Op
RoundingMode
Rounding mode.
@ NearestTiesToEven
roundTiesToEven.
@ Dynamic
Denotes mode unknown at compile time.
LLVM_ABI bool isGuaranteedNotToBeUndefOrPoison(const Value *V, AssumptionCache *AC=nullptr, const Instruction *CtxI=nullptr, const DominatorTree *DT=nullptr, unsigned Depth=0)
Return true if this function can prove that V does not have undef bits and is never poison.
constexpr unsigned BitWidth
LLVM_ABI Constant * getLosslessInvCast(Constant *C, Type *InvCastTo, unsigned CastOp, const DataLayout &DL, PreservedCastFlags *Flags=nullptr)
Try to cast C to InvC losslessly, satisfying CastOp(InvC) equals C, or CastOp(InvC) is a refined valu...
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:559
bool all_equal(std::initializer_list< T > Values)
Returns true if all Values in the initializer lists are equal or the list is empty.
Definition STLExtras.h:2156
LLVM_ABI Constant * ConstantFoldCastInstruction(unsigned opcode, Constant *V, Type *DestTy)
LLVM_ABI Constant * ConstantFoldInsertValueInstruction(Constant *Agg, Constant *Val, ArrayRef< unsigned > Idxs)
Attempt to constant fold an insertvalue instruction with the specified operands and indices.
LLVM_ABI Constant * ConstantFoldLoadFromConstPtr(Constant *C, Type *Ty, APInt Offset, const DataLayout &DL)
Return the value that a load from C with offset Offset would produce if it is constant and determinab...
LLVM_ABI Constant * ConstantFoldInstOperands(const Instruction *I, ArrayRef< Constant * > Ops, const DataLayout &DL, const TargetLibraryInfo *TLI=nullptr, bool AllowNonDeterministic=true)
ConstantFoldInstOperands - Attempt to constant fold an instruction with the specified operands.
LLVM_READONLY APFloat minimum(const APFloat &A, const APFloat &B)
Implements IEEE 754-2019 minimum semantics.
Definition APFloat.h:1598
LLVM_READONLY APFloat maximumnum(const APFloat &A, const APFloat &B)
Implements IEEE 754-2019 maximumNumber semantics.
Definition APFloat.h:1638
LLVM_ABI const Value * getUnderlyingObject(const Value *V, unsigned MaxLookup=MaxLookupSearchDepth)
This method strips off any GEP address adjustments, pointer casts or llvm.threadlocal....
LLVM_ABI Constant * ConstantFoldIntegerCast(Constant *C, Type *DestTy, bool IsSigned, const DataLayout &DL)
Constant fold a zext, sext or trunc, depending on IsSigned and whether the DestTy is wider or narrowe...
LLVM_ABI bool isTriviallyVectorizable(Intrinsic::ID ID)
Identify if the intrinsic is trivially vectorizable.
constexpr detail::IsaCheckPredicate< Types... > IsaPred
Function object wrapper for the llvm::isa type check.
Definition Casting.h:866
LLVM_ABI Constant * ConstantFoldBinaryInstruction(unsigned Opcode, Constant *V1, Constant *V2)
Represent subnormal handling kind for floating point instruction inputs and outputs.
DenormalModeKind Input
Denormal treatment kind for floating point instruction inputs in the default floating-point environme...
DenormalModeKind
Represent handled modes for denormal (aka subnormal) modes in the floating point environment.
@ PreserveSign
The sign of a flushed-to-zero number is preserved in the sign of 0.
@ PositiveZero
Denormals are flushed to positive zero.
@ Dynamic
Denormals have unknown treatment.
@ IEEE
IEEE-754 denormal numbers preserved.
DenormalModeKind Output
Denormal flushing mode for floating point instruction results in the default floating point environme...
static constexpr DenormalMode getDynamic()
static constexpr DenormalMode getIEEE()
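DenormalMode decides whether denormal inputs and outputs must be flushed before and after a floating-point fold. A minimal sketch of the query pattern:

static bool flushesInputsSketch() {
  DenormalMode Mode = DenormalMode::getIEEE();      // keep denormals unchanged
  // With DenormalMode::getDynamic() the mode is unknown at compile time,
  // so a denormal-sensitive fold has to be skipped.
  return Mode.Input == DenormalMode::PreserveSign ||
         Mode.Input == DenormalMode::PositiveZero;  // false for IEEE
}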
Incoming for lane mask phi as machine instruction, incoming register Reg and incoming block Block are...
bool isConstant() const
Returns true if we know the value of all bits.
Definition KnownBits.h:54
const APInt & getConstant() const
Returns the value when all bits have a known value.
Definition KnownBits.h:60
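computeKnownBits combined with KnownBits::isConstant is the fallback for proving that a Value which is not a Constant still has only one possible bit pattern. A sketch, assuming V is an existing integer-typed Value * and DL is the DataLayout:

static bool isProvablyConstantSketch(const Value *V, const DataLayout &DL,
                                     APInt &OnlyValue) {
  KnownBits Known(V->getType()->getScalarSizeInBits());
  computeKnownBits(V, Known, DL);
  if (!Known.isConstant())
    return false;
  OnlyValue = Known.getConstant(); // the one bit pattern V can take
  return true;
}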